All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.jruby.util.io.EncodingUtils Maven / Gradle / Ivy

There is a newer version: 9.4.12.0
Show newest version
package org.jruby.util.io;

import org.jcodings.Encoding;
import org.jruby.Ruby;
import org.jruby.RubyArray;
import org.jruby.RubyEncoding;
import org.jruby.RubyHash;
import org.jruby.RubyNumeric;
import org.jruby.runtime.ThreadContext;
import org.jruby.runtime.builtin.IRubyObject;
import org.jruby.runtime.encoding.EncodingService;
import org.jruby.util.TypeConverter;

public class EncodingUtils {    
    public static Encoding toEncoding(ThreadContext context, IRubyObject object) {
        if (object instanceof RubyEncoding) return ((RubyEncoding) object).getEncoding();
        
        return context.runtime.getEncodingService().getEncodingFromObject(object);
    }
    
    public static IRubyObject[] openArgsToArgs(Ruby runtime, IRubyObject firstElement, RubyHash options) {
        IRubyObject value = hashARef(runtime, options, "open_args");
        
        if (value.isNil()) return new IRubyObject[] { firstElement, options };
        
        RubyArray array = value.convertToArray();
        
        IRubyObject[] openArgs = new IRubyObject[array.size()];
        value.convertToArray().toArray(openArgs);
        IRubyObject[] args = new IRubyObject[openArgs.length + 1];
        
        args[0] = firstElement;
        
        System.arraycopy(openArgs, 0, args, 1, openArgs.length);
        
        return args;
    }

    // FIXME: This could be smarter amount determining whether optionsArg is a RubyHash and !null (invariant)
    // mri: extract_binmode
    public static int extractBinmode(Ruby runtime, IRubyObject optionsArg, int fmode) {
        IRubyObject v = hashARef(runtime, optionsArg, "textmode");
        if (!v.isNil() && v.isTrue()) fmode |= OpenFile.TEXTMODE;
        
        v = hashARef(runtime, optionsArg, "binmode");
        if (!v.isNil() && v.isTrue()) fmode |= OpenFile.BINMODE;

        if ((fmode & OpenFile.BINMODE) != 0 && (fmode & OpenFile.TEXTMODE) != 0) {
            throw runtime.newArgumentError("both textmode and binmode specified");
        }
        
        return fmode;
    }
    
    private static IRubyObject hashARef(Ruby runtime, IRubyObject hash, String symbol) {
        if (hash == null || !(hash instanceof RubyHash)) return runtime.getNil();
        
        IRubyObject value = ((RubyHash) hash).fastARef(runtime.newSymbol(symbol));
        
        return value == null ? runtime.getNil() : value;
    }
    
    public static Encoding ascii8bitEncoding(Ruby runtime) {
        return runtime.getEncodingService().getAscii8bitEncoding();   
    }
    
    public static final int PERM = 0;
    public static final int VMODE = 1;
    
    /*
     * This is a wacky method which is a very near port from MRI.  pm passes in 
     * a permissions value and a mode value.  As a side-effect mode will get set
     * if this found any 'mode'-like stuff so the caller can know whether mode 
     * has been handled yet.   The same story for permission value.  If it has
     * not been set then we know it needs to default permissions from the caller.
     */
    // mri: rb_io_extract_modeenc
    public static int extractModeEncoding(ThreadContext context, 
            IOEncodable ioEncodable, IRubyObject[] pm, IRubyObject options, boolean secondTime) {
        int fmode; // OpenFile
        boolean hasEncoding = false;
        int oflags = 0; // ModeFlags
        
        // Give default encodings
        setupReadWriteEncodings(context, ioEncodable, null, null);

        if (pm[VMODE] == null || pm[VMODE].isNil()) {
            fmode = OpenFile.READABLE;
            oflags = ModeFlags.RDONLY;
        } else {
            IRubyObject intMode = TypeConverter.checkIntegerType(context.runtime, pm[VMODE], "to_int");
            
            if (!intMode.isNil()) {
                pm[VMODE] = intMode;
                oflags = RubyNumeric.num2int(intMode);
                fmode = ModeFlags.getOpenFileFlagsFor(oflags);
            } else {
                String p = pm[VMODE].convertToString().asJavaString();
                int colonSplit = p.indexOf(":");
                String mode = colonSplit == -1 ? p : p.substring(0, colonSplit);
                try {
                    fmode = OpenFile.getFModeFromString(mode);
                    oflags = OpenFile.getModeFlagsAsIntFrom(fmode);
                } catch (InvalidValueException e) {
                    throw context.runtime.newArgumentError("illegal access mode " + pm[VMODE]);
                }
                
                if (colonSplit != -1) {
                    hasEncoding = true;
                    parseModeEncoding(context, ioEncodable, p.substring(colonSplit + 1));
                } else {
                    Encoding e = (fmode & OpenFile.BINMODE) != 0 ? ascii8bitEncoding(context.runtime) : null;
                    setupReadWriteEncodings(context, ioEncodable, null, e);
                }
            }
        }
        
        if (options == null || options.isNil()) {
            // FIXME: Set up ecflags
        } else {
            fmode = extractBinmode(context.runtime, options, fmode);
            // Differs from MRI but we open with ModeFlags
            oflags |= OpenFile.getModeFlagsAsIntFrom(fmode);

            // FIXME: What is DEFAULT_TEXTMODE
            
            if (!secondTime) {
                IRubyObject v = hashARef(context.runtime, options, "mode");
                
                if (!v.isNil()) {
                    if (pm[VMODE] != null && !pm[VMODE].isNil()) {
                        throw context.runtime.newArgumentError("mode specified twice");
                    }
                    secondTime = true;
                    pm[VMODE] = v;
                  
                    return extractModeEncoding(context, ioEncodable, pm, options, true);
                }
            } 
            IRubyObject v = hashARef(context.runtime, options, "perm");
            if (!v.isNil()) {
                if (pm[PERM] != null) {
                    if (!pm[PERM].isNil()) throw context.runtime.newArgumentError("perm specified twice");
                    
                    pm[PERM] = v;
                }
            }
        
            if (getEncodingOptionFromObject(context, ioEncodable, options)) {
                if (hasEncoding) throw context.runtime.newArgumentError("encoding specified twice");
            }
            
            
        }
        
        return oflags;
    }

    // mri: rb_io_extract_encoding_option
    public static boolean getEncodingOptionFromObject(ThreadContext context, IOEncodable ioEncodable, IRubyObject options) {
        if (options == null || options.isNil()) return false;
        
        options = TypeConverter.checkHashType(context.runtime, options);        

        // FIXME: This is workaround for MRI compat (they do this differently) and I think a bug: http://bugs.ruby-lang.org/issues/7837
        if (!(options instanceof RubyHash)) throw context.runtime.newArgumentError("wrong number of arguments (3 for 1..2)");


        RubyHash opts = (RubyHash) options;        
        boolean extracted = false;
        Encoding externalEncoding = null;
        
        Ruby runtime = options.getRuntime();
        IRubyObject encodingOpt = opts.fastARef(runtime.newSymbol("encoding"));
        IRubyObject externalOpt = opts.fastARef(runtime.newSymbol("external_encoding"));
        IRubyObject internalOpt = opts.fastARef(runtime.newSymbol("internal_encoding"));
        
        if ((externalOpt != null || internalOpt != null) && encodingOpt != null && !encodingOpt.isNil()) {
                runtime.getWarnings().warn("Ignoring encoding parameter '" + encodingOpt + "': " + 
                        (externalOpt == null ? "internal" : "external") + "_encoding is used");
                encodingOpt = null;
        }
        
        if (externalOpt != null && !externalOpt.isNil()) externalEncoding = toEncoding(context, externalOpt);

        Encoding internalEncoding = null;

        if (internalOpt != null) {
            if (internalOpt.isNil() || internalOpt.asString().toString().equals("-")) {
                internalEncoding = null;
            } else {
                internalEncoding = toEncoding(context, internalOpt);
            }
            
            if (externalEncoding == internalEncoding) internalEncoding = null;
        }
        
        if (encodingOpt != null && !encodingOpt.isNil()) {
            extracted = true;
            
            IRubyObject tmp = encodingOpt.checkStringType19();
            if (!tmp.isNil()) {
                parseModeEncoding(context, ioEncodable, tmp.convertToString().toString());
            } else {
                setupReadWriteEncodings(context, ioEncodable, null, toEncoding(context, encodingOpt));
            }
        } else if (externalOpt != null || internalEncoding != null) {
            extracted = true;
            setupReadWriteEncodings(context, ioEncodable, internalEncoding, externalEncoding);
        }
        
        return extracted;
    }
    
    // mri: rb_io_ext_int_to_encs
    public static void setupReadWriteEncodings(ThreadContext context, IOEncodable encodable, 
            Encoding internal, Encoding external) {
        boolean defaultExternal = false;
        
        if (external == null) {
            external = context.runtime.getDefaultExternalEncoding();
            defaultExternal = true;
        }
        
        if (internal == null && external != ascii8bitEncoding(context.runtime)) {
            internal = context.runtime.getDefaultInternalEncoding();
        }
        
        if (internal == null || internal == external) { // missing internal == nil?
            encodable.setReadEncoding((defaultExternal && internal != external) ? null : external);
            encodable.setWriteEncoding(null);
        } else {
            encodable.setReadEncoding(internal);
            encodable.setWriteEncoding(external);
        }
    }    

    // mri: parse_mode_enc
    public static void parseModeEncoding(ThreadContext context, IOEncodable ioEncodable, String option) {
        Ruby runtime = context.runtime;
        EncodingService service = runtime.getEncodingService();
        Encoding intEncoding = null;

        String[] encs = option.split(":", 2);

        if (encs[0].toLowerCase().startsWith("bom|utf-")) {
            ioEncodable.setBOM(true);
            encs[0] = encs[0].substring(4);
        }

        Encoding extEncoding = service.getEncodingFromString(encs[0]);

        if (encs.length > 1) {
            if (encs[1].equals("-")) {
                // null;
            } else {
                intEncoding = service.getEncodingFromString(encs[1]);
            }
        }

        setupReadWriteEncodings(context, ioEncodable, intEncoding, extEncoding);
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy