aboutsummaryrefslogtreecommitdiffstats
path: root/transcode.c
diff options
context:
space:
mode:
author: akr <akr@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2008-08-25 16:27:23 +0000
committer: akr <akr@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2008-08-25 16:27:23 +0000
commit: 873987f2e0796e04ca0ac0aed885137f8e523338 (patch)
tree: 460f3dd7af8c73b17de772fbf6a51b55f3e07fae /transcode.c
parent: 1a805010ed9e9edc99f2abefa5d4431eb54b43f4 (diff)
download: ruby-873987f2e0796e04ca0ac0aed885137f8e523338.tar.gz
* transcode.c (str_transcode0): disable newline conversion for
ASCII-incompatible encodings.

git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@18853 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'transcode.c')
-rw-r--r-- transcode.c 29
1 files changed, 22 insertions, 7 deletions
diff --git a/transcode.c b/transcode.c
index 40db7c71af..8a57054eb2 100644
--- a/transcode.c
+++ b/transcode.c
@@ -1861,7 +1861,7 @@ str_transcode_enc_args(VALUE str, VALUE arg1, VALUE arg2,
}
static int
-str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts)
+str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts_arg)
{
VALUE dest;
VALUE str = *self;
@@ -1871,6 +1871,7 @@ str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts)
rb_encoding *from_enc, *to_enc;
const char *from_e, *to_e;
int to_encidx;
+ rb_econv_option_t ecopts;
if (argc < 1 || argc > 2) {
rb_raise(rb_eArgError, "wrong number of arguments (%d for 1..2)", argc);
@@ -1878,9 +1879,25 @@ str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts)
to_encidx = str_transcode_enc_args(str, argv[0], argc==1 ? Qnil : argv[1], &from_e, &from_enc, &to_e, &to_enc);
- if ((ecopts->flags & (ECONV_UNIVERSAL_NEWLINE_DECODER|
- ECONV_CRLF_NEWLINE_ENCODER|
- ECONV_CR_NEWLINE_ENCODER)) == 0) {
+ if (ecopts_arg)
+ ecopts = *ecopts_arg;
+ else
+ rb_econv_opts(Qnil, &ecopts);
+
+ /* disable newline conversion for ascii incompatible encoding.
+ * xxx: convert newline in ascii-compatible encoding?
+ * ex. UTF-16BE -> UTF-8 -> newline conversion -> UTF-8 -> UTF-16BE.
+ */
+ if (!from_enc || !rb_enc_asciicompat(from_enc)) {
+ ecopts.flags &= ~(ECONV_CRLF_NEWLINE_ENCODER|ECONV_CR_NEWLINE_ENCODER);
+ }
+ if (!to_enc || !rb_enc_asciicompat(to_enc)) {
+ ecopts.flags &= ~ECONV_UNIVERSAL_NEWLINE_DECODER;
+ }
+
+ if ((ecopts.flags & (ECONV_UNIVERSAL_NEWLINE_DECODER|
+ ECONV_CRLF_NEWLINE_ENCODER|
+ ECONV_CR_NEWLINE_ENCODER)) == 0) {
if (from_enc && from_enc == to_enc) {
return -1;
}
@@ -1895,8 +1912,6 @@ str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts)
}
else {
if (encoding_equal(from_e, to_e)) {
- /* newline conversion only.
- * xxx: this assumes ascii compatible encoding. */
from_e = "";
to_e = "";
}
@@ -1908,7 +1923,7 @@ str_transcode0(int argc, VALUE *argv, VALUE *self, rb_econv_option_t *ecopts)
dest = rb_str_tmp_new(blen);
bp = (unsigned char *)RSTRING_PTR(dest);
- transcode_loop(&fromp, &bp, (sp+slen), (bp+blen), dest, str_transcoding_resize, from_e, to_e, ecopts);
+ transcode_loop(&fromp, &bp, (sp+slen), (bp+blen), dest, str_transcoding_resize, from_e, to_e, &ecopts);
if (fromp != sp+slen) {
rb_raise(rb_eArgError, "not fully converted, %"PRIdPTRDIFF" bytes left", sp+slen-fromp);
}