jython/src/org/python/modules/_io/_jyio.java at master · jython/jython

History

328 lines (296 loc) · 18.1 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

package org.python.modules._io;

import org.python.core.ArgParser;

import org.python.core.ClassDictInit;

import org.python.core.Py;

import org.python.core.PyException;

import org.python.core.PyInteger;

import org.python.core.PyObject;

import org.python.core.PyString;

import org.python.core.PyStringMap;

import org.python.core.PyType;

import org.python.core.imp;

import org.python.core.io.IOBase;

/**
 * The Python _io module implemented in Java.
 */

public class _jyio implements ClassDictInit {

/**
 * This method is called when the module is loaded, to populate the namespace (dictionary) of
 * the module. The dictionary has been initialised at this point reflectively from the methods
 * of this class and this method nulls those entries that ought not to be exposed.
 *
 * @param dict namespace of the module
 */

public static void classDictInit(PyObject dict) {
    // Identity and documentation of the module.
    PyString moduleName = new PyString("_jyio");
    dict.__setitem__("__name__", moduleName);
    PyString moduleDoc = new PyString(__doc__);
    dict.__setitem__("__doc__", moduleDoc);
    dict.__setitem__("DEFAULT_BUFFER_SIZE", DEFAULT_BUFFER_SIZE);

    // The stream types implemented in Java, published under their Python names.
    dict.__setitem__("_IOBase", PyIOBase.TYPE);
    dict.__setitem__("_RawIOBase", PyRawIOBase.TYPE);
    dict.__setitem__("FileIO", PyFileIO.TYPE);

    // Look up the two base classes needed for the UnsupportedOperation exception.
    PyObject builtinExceptions = imp.load("exceptions");
    PyObject valueErrorType = builtinExceptions.__getattr__("ValueError");
    PyObject ioErrorType = builtinExceptions.__getattr__("IOError");

    // Equivalent to class UnsupportedOperation(ValueError, IOError) : pass
    // makeException also stores the new type in dict; we keep a reference for Java callers.
    UnsupportedOperation =
            makeException(dict, "UnsupportedOperation", valueErrorType, ioErrorType);

    // Hide the Java-side plumbing from Python by nulling its entries.
    for (String hidden : new String[] {"classDictInit", "makeException"}) {
        dict.__setitem__(hidden, null);
    }
}

/**
 * A Python class for the <code>UnsupportedOperation</code> exception. The field has no
 * initialiser: it is assigned in <code>classDictInit</code> from the type built by
 * <code>makeException</code>, so it is <code>null</code> until that method has run.
 */
public static PyType UnsupportedOperation;

/**
 * A function that returns a {@link PyException}, which is a Java exception suitable for
 * throwing, and that will be raised as an <code>UnsupportedOperation</code> Python exception.
 *
 * @param message text message parameter to the Python exception
 * @return nascent <code>UnsupportedOperation</code> Python exception
 */

public static PyException UnsupportedOperation(String message) {
    // Here the bare name UnsupportedOperation resolves to the static field holding the
    // exception type, not to this method: pair that type with the caller's message.
    PyException unsupported = new PyException(UnsupportedOperation, message);
    return unsupported;
}

/**
 * Convenience method for constructing a type object of a Python exception, named as given, and
 * added to the namespace of the "_io" module.
 *
 * @param dict module dictionary
 * @param excname name of the exception
 * @param bases one or more bases (superclasses)
 * @return the constructed exception type
 */

private static PyType makeException(PyObject dict, String excname, PyObject... bases) {
    // Namespace of the new class: its single entry names "_io" as the defining module.
    PyStringMap namespace = new PyStringMap();
    namespace.__setitem__("__module__", Py.newString("_io"));

    // Build the class from its name, bases and namespace.
    PyObject created = Py.makeClass(excname, bases, namespace);
    PyType excType = (PyType)created;

    // Publish the type in the supplied module dictionary under its own name.
    dict.__setitem__(excname, excType);
    return excType;
}

/**
 * Default buffer size obtained from {@link IOBase#DEFAULT_BUFFER_SIZE}. <code>open()</code>
 * falls back on this value when the caller has not asked for a specific buffer size.
 */
private static final int _DEFAULT_BUFFER_SIZE = IOBase.DEFAULT_BUFFER_SIZE;

/**
 * Default buffer size for export: the same value wrapped as a Python integer, which
 * <code>classDictInit</code> stores in the module dictionary as
 * <code>DEFAULT_BUFFER_SIZE</code>.
 */
public static final PyInteger DEFAULT_BUFFER_SIZE = new PyInteger(_DEFAULT_BUFFER_SIZE);

/**

* Open file and return a stream. Raise IOError upon failure. This is a port to Java of the

* CPython _io.open (Modules/_io/_iomodule.c) following the same logic, but expressed with the

* benefits of Java syntax.

* @param args array of arguments from Python call via Jython framework

* @param kwds array of keywords from Python call via Jython framework

* @return the stream object

public static PyObject open(PyObject[] args, String[] kwds) {

// Get the arguments to variables

ArgParser ap = new ArgParser("open", args, kwds, openKwds, 1);

PyObject file = ap.getPyObject(0);

String m = ap.getString(1, "r");

int buffering = ap.getInt(2, -1);

final String encoding = ap.getString(3, null);

final String errors = ap.getString(4, null);

final String newline = ap.getString(5, null);

boolean closefd = Py.py2boolean(ap.getPyObject(6, Py.True));

// Decode the mode string

OpenMode mode = new OpenMode(m) {

@Override

public void validate() {

super.validate();

validate(encoding, errors, newline);

}

};

mode.checkValid();

* Create the Raw file stream. Let the constructor deal with the variants and argument

* checking.

PyFileIO raw = new PyFileIO(file, mode, closefd);

* From the Python documentation for io.open() buffering = 0 to switch buffering off (only

* allowed in binary mode), 1 to select line buffering (only usable in text mode), and an

* integer > 1 to indicate the size of a fixed-size buffer.

* When no buffering argument is given, the default buffering policy works as follows:

* Binary files are buffered in fixed-size chunks; "Interactive" text files (files for which

* isatty() returns True) use line buffering. Other text files use the policy described

* above for binary files.

* In Java, it seems a stream never is *known* to be interactive, but we ask anyway, and

* maybe one day we shall know.

boolean line_buffering = false;

if (buffering == 0) {

if (!mode.binary) {

throw Py.ValueError("can't have unbuffered text I/O");

}

return raw;

} else if (buffering == 1) {

// The stream is to be read line-by-line.

line_buffering = true;

// Force default size for actual buffer

buffering = -1;

} else if (buffering < 0 && raw.isatty()) {

// No buffering argument given but stream is inteeractive.

line_buffering = true;

}

if (buffering < 0) {

* We are still being asked for the default buffer size. CPython establishes the default

* buffer size using fstat(fd), but Java appears to give no clue. A useful study of

* buffer sizes in NIO is http://www.evanjones.ca/software/java-bytebuffers.html . This

* leads us to the fixed choice of _DEFAULT_BUFFER_SIZE (=8KB).

buffering = _DEFAULT_BUFFER_SIZE;

}

* We now know just what particular class of file we are opening, and therefore what stack

* (buffering and text encoding) we should build.

if (buffering == 0) {

// Not buffering, return the raw file object

return raw;

} else {

// We are buffering, so wrap raw into a buffered file

PyObject bufferType = null;

PyObject io = imp.load("io");

if (mode.updating) {

bufferType = io.__getattr__("BufferedRandom");

} else if (mode.writing || mode.appending) {

bufferType = io.__getattr__("BufferedWriter");

} else { // = reading

bufferType = io.__getattr__("BufferedReader");

}

PyInteger pyBuffering = new PyInteger(buffering);

PyObject buffer = bufferType.__call__(raw, pyBuffering);

if (mode.binary) {

// If binary, return the just the buffered file

return buffer;

} else {

// We are opening in text mode, so wrap buffered file in a TextIOWrapper.

PyObject textType = io.__getattr__("TextIOWrapper");

PyObject[] textArgs =

{buffer, ap.getPyObject(3, Py.None), ap.getPyObject(4, Py.None),

ap.getPyObject(5, Py.None), Py.newBoolean(line_buffering)};

PyObject wrapper = textType.__call__(textArgs);

wrapper.__setattr__("mode", new PyString(m));

return wrapper;

}

/**
 * Keyword names handed to the <code>ArgParser</code> in <code>open()</code>. The position of
 * a name in this array is the index <code>open()</code> uses to fetch that argument (0 =
 * file, 1 = mode, ... 6 = closefd), so the order here must stay in step with those indices.
 */
private static final String[] openKwds = {"file", "mode", "buffering", "encoding", "errors",
"newline", "closefd"};

/**
 * Documentation string of the module. <code>classDictInit</code> wraps this text in a
 * <code>PyString</code> and stores it in the module dictionary as <code>__doc__</code>, so
 * the text is visible to Python at run time.
 */
public static final String __doc__ =
"The io module provides the Python interfaces to stream handling. The\n"
+ "builtin open function is defined in this module.\n" + "\n"
+ "At the top of the I/O hierarchy is the abstract base class IOBase. It\n"
+ "defines the basic interface to a stream. Note, however, that there is no\n"
+ "seperation between reading and writing to streams; implementations are\n"
+ "allowed to throw an IOError if they do not support a given operation.\n"
+ "\n"
+ "Extending IOBase is RawIOBase which deals simply with the reading and\n"
+ "writing of raw bytes to a stream. FileIO subclasses RawIOBase to provide\n"
+ "an interface to OS files.\n" + "\n"
+ "BufferedIOBase deals with buffering on a raw byte stream (RawIOBase). Its\n"
+ "subclasses, BufferedWriter, BufferedReader, and BufferedRWPair buffer\n"
+ "streams that are readable, writable, and both respectively.\n"
+ "BufferedRandom provides a buffered interface to random access\n"
+ "streams. BytesIO is a simple stream of in-memory bytes.\n" + "\n"
+ "Another IOBase subclass, TextIOBase, deals with the encoding and decoding\n"
+ "of streams into text. TextIOWrapper, which extends it, is a buffered text\n"
+ "interface to a buffered raw stream (`BufferedIOBase`). Finally, StringIO\n"
+ "is a in-memory stream for text.\n" + "\n"
+ "Argument names are not part of the specification, and only the arguments\n"
+ "of open() are intended to be used as keyword arguments.\n";

/**
 * Documentation text describing <code>open()</code>: its arguments (file, mode, buffering,
 * encoding, errors, newline, closefd) and the kind of object returned for each mode.
 * NOTE(review): nothing in this file reads the field directly; presumably the Jython
 * framework associates it with <code>open</code> through the <code>__doc__</code> name
 * prefix -- confirm before renaming.
 */
public static final String __doc__open =
"Open file and return a stream. Raise IOError upon failure.\n" + "\n"
+ "file is either a text or byte string giving the name (and the path\n"
+ "if the file isn't in the current working directory) of the file to\n"
+ "be opened or an integer file descriptor of the file to be\n"
+ "wrapped. (If a file descriptor is given, it is closed when the\n"
+ "returned I/O object is closed, unless closefd is set to False.)\n" + "\n"
+ "mode is an optional string that specifies the mode in which the file\n"
+ "is opened. It defaults to 'r' which means open for reading in text\n"
+ "mode. Other common values are 'w' for writing (truncating the file if\n"
+ "it already exists), and 'a' for appending (which on some Unix systems,\n"
+ "means that all writes append to the end of the file regardless of the\n"
+ "current seek position). In text mode, if encoding is not specified the\n"
+ "encoding used is platform dependent. (For reading and writing raw\n"
+ "bytes use binary mode and leave encoding unspecified.) The available\n"
+ "modes are:\n" + "\n"
+ "========= ===============================================================\n"
+ "Character Meaning\n"
+ "--------- ---------------------------------------------------------------\n"
+ "'r' open for reading (default)\n"
+ "'w' open for writing, truncating the file first\n"
+ "'a' open for writing, appending to the end of the file if it exists\n"
+ "'b' binary mode\n" + "'t' text mode (default)\n"
+ "'+' open a disk file for updating (reading and writing)\n"
+ "'U' universal newline mode (for backwards compatibility; unneeded\n"
+ " for new code)\n"
+ "========= ===============================================================\n"
+ "\n"
+ "The default mode is 'rt' (open for reading text). For binary random\n"
+ "access, the mode 'w+b' opens and truncates the file to 0 bytes, while\n"
+ "'r+b' opens the file without truncation.\n" + "\n"
+ "Python distinguishes between files opened in binary and text modes,\n"
+ "even when the underlying operating system doesn't. Files opened in\n"
+ "binary mode (appending 'b' to the mode argument) return contents as\n"
+ "bytes objects without any decoding. In text mode (the default, or when\n"
+ "'t' is appended to the mode argument), the contents of the file are\n"
+ "returned as strings, the bytes having been first decoded using a\n"
+ "platform-dependent encoding or using the specified encoding if given.\n"
+ "\n" + "buffering is an optional integer used to set the buffering policy.\n"
+ "Pass 0 to switch buffering off (only allowed in binary mode), 1 to select\n"
+ "line buffering (only usable in text mode), and an integer > 1 to indicate\n"
+ "the size of a fixed-size chunk buffer. When no buffering argument is\n"
+ "given, the default buffering policy works as follows:\n" + "\n"
+ "* Binary files are buffered in fixed-size chunks; the size of the buffer\n"
+ " is chosen using a heuristic trying to determine the underlying device's\n"
+ " \"block size\" and falling back on `io.DEFAULT_BUFFER_SIZE`.\n"
+ " On many systems, the buffer will typically be 4096 or 8192 bytes long.\n"
+ "\n"
+ "* \"Interactive\" text files (files for which isatty() returns True)\n"
+ " use line buffering. Other text files use the policy described above\n"
+ " for binary files.\n" + "\n"
+ "encoding is the name of the encoding used to decode or encode the\n"
+ "file. This should only be used in text mode. The default encoding is\n"
+ "platform dependent, but any encoding supported by Python can be\n"
+ "passed. See the codecs module for the list of supported encodings.\n"
+ "\n"
+ "errors is an optional string that specifies how encoding errors are to\n"
+ "be handled---this argument should not be used in binary mode. Pass\n"
+ "'strict' to raise a ValueError exception if there is an encoding error\n"
+ "(the default of None has the same effect), or pass 'ignore' to ignore\n"
+ "errors. (Note that ignoring encoding errors can lead to data loss.)\n"
+ "See the documentation for codecs.register for a list of the permitted\n"
+ "encoding error strings.\n" + "\n"
+ "newline controls how universal newlines works (it only applies to text\n"
+ "mode). It can be None, '', '\\n', '\\r', and '\\r\\n'. It works as\n"
+ "follows:\n" + "\n"
+ "* On input, if newline is None, universal newlines mode is\n"
+ " enabled. Lines in the input can end in '\\n', '\\r', or '\\r\\n', and\n"
+ " these are translated into '\\n' before being returned to the\n"
+ " caller. If it is '', universal newline mode is enabled, but line\n"
+ " endings are returned to the caller untranslated. If it has any of\n"
+ " the other legal values, input lines are only terminated by the given\n"
+ " string, and the line ending is returned to the caller untranslated.\n"
+ "\n" + "* On output, if newline is None, any '\\n' characters written are\n"
+ " translated to the system default line separator, os.linesep. If\n"
+ " newline is '', no translation takes place. If newline is any of the\n"
+ " other legal values, any '\\n' characters written are translated to\n"
+ " the given string.\n" + "\n"
+ "If closefd is False, the underlying file descriptor will be kept open\n"
+ "when the file is closed. This does not work when a file name is given\n"
+ "and must be True in that case.\n" + "\n"
+ "open() returns a file object whose type depends on the mode, and\n"
+ "through which the standard file operations such as reading and writing\n"
+ "are performed. When open() is used to open a file in a text mode ('w',\n"
+ "'r', 'wt', 'rt', etc.), it returns a TextIOWrapper. When used to open\n"
+ "a file in a binary mode, the returned class varies: in read binary\n"
+ "mode, it returns a BufferedReader; in write binary and append binary\n"
+ "modes, it returns a BufferedWriter, and in read/write mode, it returns\n"
+ "a BufferedRandom.\n" + "\n"
+ "It is also possible to use a string or bytearray as a file for both\n"
+ "reading and writing. For strings StringIO can be used like a file\n"
+ "opened in a text mode, and for bytes a BytesIO can be used like a file\n"
+ "opened in a binary mode.\n";

}

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

_jyio.java

Latest commit

History

_jyio.java

File metadata and controls