PageRenderTime 43ms CodeModel.GetById 13ms RepoModel.GetById 0ms app.codeStats 1ms

/External.LCA_RESTRICTED/Languages/IronPython/27/Lib/test/test_fileinput.py

http://github.com/IronLanguages/main
Python | 335 lines | 311 code | 11 blank | 13 comment | 4 complexity | 3df24706ab2d1811317d8939ec9e8d5e MD5 | raw file
Possible License(s): CPL-1.0, BSD-3-Clause, ISC, GPL-2.0, MPL-2.0-no-copyleft-exception
  1. '''
  2. Tests for fileinput module.
  3. Nick Mathewson
  4. '''
  5. import unittest
  6. from test.test_support import verbose, TESTFN, run_unittest
  7. from test.test_support import unlink as safe_unlink, check_warnings
  8. import sys, re
  9. from StringIO import StringIO
  10. from fileinput import FileInput, hook_encoded
  11. # The fileinput module has 2 interfaces: the FileInput class which does
  12. # all the work, and a few functions (input, etc.) that use a global _state
  13. # variable. We only test the FileInput class, since the other functions
  14. # only provide a thin facade over FileInput.
  15. # Write lines (a list of lines) to temp file number i, and return the
  16. # temp file's name.
  17. def writeTmp(i, lines, mode='w'): # opening in text mode is the default
  18. name = TESTFN + str(i)
  19. f = open(name, mode)
  20. f.writelines(lines)
  21. f.close()
  22. return name
  23. def remove_tempfiles(*names):
  24. for name in names:
  25. safe_unlink(name)
  26. class LineReader:
  27. def __init__(self):
  28. self._linesread = []
  29. @property
  30. def linesread(self):
  31. try:
  32. return self._linesread[:]
  33. finally:
  34. self._linesread = []
  35. def openhook(self, filename, mode):
  36. self.it = iter(filename.splitlines(True))
  37. return self
  38. def readline(self, size=None):
  39. line = next(self.it, '')
  40. self._linesread.append(line)
  41. return line
  42. def readlines(self, hint=-1):
  43. lines = []
  44. size = 0
  45. while True:
  46. line = self.readline()
  47. if not line:
  48. return lines
  49. lines.append(line)
  50. size += len(line)
  51. if size >= hint:
  52. return lines
  53. def close(self):
  54. pass
  55. class BufferSizesTests(unittest.TestCase):
  56. def test_buffer_sizes(self):
  57. # First, run the tests with default and teeny buffer size.
  58. for round, bs in (0, 0), (1, 30):
  59. try:
  60. t1 = writeTmp(1, ["Line %s of file 1\n" % (i+1) for i in range(15)])
  61. t2 = writeTmp(2, ["Line %s of file 2\n" % (i+1) for i in range(10)])
  62. t3 = writeTmp(3, ["Line %s of file 3\n" % (i+1) for i in range(5)])
  63. t4 = writeTmp(4, ["Line %s of file 4\n" % (i+1) for i in range(1)])
  64. self.buffer_size_test(t1, t2, t3, t4, bs, round)
  65. finally:
  66. remove_tempfiles(t1, t2, t3, t4)
  67. def buffer_size_test(self, t1, t2, t3, t4, bs=0, round=0):
  68. pat = re.compile(r'LINE (\d+) OF FILE (\d+)')
  69. start = 1 + round*6
  70. if verbose:
  71. print '%s. Simple iteration (bs=%s)' % (start+0, bs)
  72. fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
  73. lines = list(fi)
  74. fi.close()
  75. self.assertEqual(len(lines), 31)
  76. self.assertEqual(lines[4], 'Line 5 of file 1\n')
  77. self.assertEqual(lines[30], 'Line 1 of file 4\n')
  78. self.assertEqual(fi.lineno(), 31)
  79. self.assertEqual(fi.filename(), t4)
  80. if verbose:
  81. print '%s. Status variables (bs=%s)' % (start+1, bs)
  82. fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
  83. s = "x"
  84. while s and s != 'Line 6 of file 2\n':
  85. s = fi.readline()
  86. self.assertEqual(fi.filename(), t2)
  87. self.assertEqual(fi.lineno(), 21)
  88. self.assertEqual(fi.filelineno(), 6)
  89. self.assertFalse(fi.isfirstline())
  90. self.assertFalse(fi.isstdin())
  91. if verbose:
  92. print '%s. Nextfile (bs=%s)' % (start+2, bs)
  93. fi.nextfile()
  94. self.assertEqual(fi.readline(), 'Line 1 of file 3\n')
  95. self.assertEqual(fi.lineno(), 22)
  96. fi.close()
  97. if verbose:
  98. print '%s. Stdin (bs=%s)' % (start+3, bs)
  99. fi = FileInput(files=(t1, t2, t3, t4, '-'), bufsize=bs)
  100. savestdin = sys.stdin
  101. try:
  102. sys.stdin = StringIO("Line 1 of stdin\nLine 2 of stdin\n")
  103. lines = list(fi)
  104. self.assertEqual(len(lines), 33)
  105. self.assertEqual(lines[32], 'Line 2 of stdin\n')
  106. self.assertEqual(fi.filename(), '<stdin>')
  107. fi.nextfile()
  108. finally:
  109. sys.stdin = savestdin
  110. if verbose:
  111. print '%s. Boundary conditions (bs=%s)' % (start+4, bs)
  112. fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
  113. self.assertEqual(fi.lineno(), 0)
  114. self.assertEqual(fi.filename(), None)
  115. fi.nextfile()
  116. self.assertEqual(fi.lineno(), 0)
  117. self.assertEqual(fi.filename(), None)
  118. if verbose:
  119. print '%s. Inplace (bs=%s)' % (start+5, bs)
  120. savestdout = sys.stdout
  121. try:
  122. fi = FileInput(files=(t1, t2, t3, t4), inplace=1, bufsize=bs)
  123. for line in fi:
  124. line = line[:-1].upper()
  125. print line
  126. fi.close()
  127. finally:
  128. sys.stdout = savestdout
  129. fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
  130. for line in fi:
  131. self.assertEqual(line[-1], '\n')
  132. m = pat.match(line[:-1])
  133. self.assertNotEqual(m, None)
  134. self.assertEqual(int(m.group(1)), fi.filelineno())
  135. fi.close()
  136. class FileInputTests(unittest.TestCase):
  137. def test_zero_byte_files(self):
  138. try:
  139. t1 = writeTmp(1, [""])
  140. t2 = writeTmp(2, [""])
  141. t3 = writeTmp(3, ["The only line there is.\n"])
  142. t4 = writeTmp(4, [""])
  143. fi = FileInput(files=(t1, t2, t3, t4))
  144. line = fi.readline()
  145. self.assertEqual(line, 'The only line there is.\n')
  146. self.assertEqual(fi.lineno(), 1)
  147. self.assertEqual(fi.filelineno(), 1)
  148. self.assertEqual(fi.filename(), t3)
  149. line = fi.readline()
  150. self.assertFalse(line)
  151. self.assertEqual(fi.lineno(), 1)
  152. self.assertEqual(fi.filelineno(), 0)
  153. self.assertEqual(fi.filename(), t4)
  154. fi.close()
  155. finally:
  156. remove_tempfiles(t1, t2, t3, t4)
  157. def test_files_that_dont_end_with_newline(self):
  158. try:
  159. t1 = writeTmp(1, ["A\nB\nC"])
  160. t2 = writeTmp(2, ["D\nE\nF"])
  161. fi = FileInput(files=(t1, t2))
  162. lines = list(fi)
  163. self.assertEqual(lines, ["A\n", "B\n", "C", "D\n", "E\n", "F"])
  164. self.assertEqual(fi.filelineno(), 3)
  165. self.assertEqual(fi.lineno(), 6)
  166. finally:
  167. remove_tempfiles(t1, t2)
  168. def test_unicode_filenames(self):
  169. try:
  170. t1 = writeTmp(1, ["A\nB"])
  171. encoding = sys.getfilesystemencoding()
  172. if encoding is None:
  173. encoding = 'ascii'
  174. fi = FileInput(files=unicode(t1, encoding))
  175. lines = list(fi)
  176. self.assertEqual(lines, ["A\n", "B"])
  177. finally:
  178. remove_tempfiles(t1)
  179. def test_fileno(self):
  180. try:
  181. t1 = writeTmp(1, ["A\nB"])
  182. t2 = writeTmp(2, ["C\nD"])
  183. fi = FileInput(files=(t1, t2))
  184. self.assertEqual(fi.fileno(), -1)
  185. line = fi.next()
  186. self.assertNotEqual(fi.fileno(), -1)
  187. fi.nextfile()
  188. self.assertEqual(fi.fileno(), -1)
  189. line = list(fi)
  190. self.assertEqual(fi.fileno(), -1)
  191. finally:
  192. remove_tempfiles(t1, t2)
  193. def test_opening_mode(self):
  194. try:
  195. # invalid mode, should raise ValueError
  196. fi = FileInput(mode="w")
  197. self.fail("FileInput should reject invalid mode argument")
  198. except ValueError:
  199. pass
  200. try:
  201. # try opening in universal newline mode
  202. t1 = writeTmp(1, ["A\nB\r\nC\rD"], mode="wb")
  203. fi = FileInput(files=t1, mode="U")
  204. lines = list(fi)
  205. self.assertEqual(lines, ["A\n", "B\n", "C\n", "D"])
  206. finally:
  207. remove_tempfiles(t1)
  208. def test_file_opening_hook(self):
  209. try:
  210. # cannot use openhook and inplace mode
  211. fi = FileInput(inplace=1, openhook=lambda f,m: None)
  212. self.fail("FileInput should raise if both inplace "
  213. "and openhook arguments are given")
  214. except ValueError:
  215. pass
  216. try:
  217. fi = FileInput(openhook=1)
  218. self.fail("FileInput should check openhook for being callable")
  219. except ValueError:
  220. pass
  221. try:
  222. # UTF-7 is a convenient, seldom used encoding
  223. t1 = writeTmp(1, ['+AEE-\n+AEI-'], mode="wb")
  224. fi = FileInput(files=t1, openhook=hook_encoded("utf-7"))
  225. lines = list(fi)
  226. self.assertEqual(lines, [u'A\n', u'B'])
  227. finally:
  228. remove_tempfiles(t1)
  229. def test_readline(self):
  230. with open(TESTFN, 'wb') as f:
  231. f.write('A\nB\r\nC\r')
  232. # Fill TextIOWrapper buffer.
  233. f.write('123456789\n' * 1000)
  234. # Issue #20501: readline() shouldn't read whole file.
  235. f.write('\x80')
  236. self.addCleanup(safe_unlink, TESTFN)
  237. fi = FileInput(files=TESTFN, openhook=hook_encoded('ascii'))
  238. # The most likely failure is a UnicodeDecodeError due to the entire
  239. # file being read when it shouldn't have been.
  240. self.assertEqual(fi.readline(), u'A\n')
  241. self.assertEqual(fi.readline(), u'B\r\n')
  242. self.assertEqual(fi.readline(), u'C\r')
  243. with self.assertRaises(UnicodeDecodeError):
  244. # Read to the end of file.
  245. list(fi)
  246. fi.close()
  247. def test_readline_buffering(self):
  248. src = LineReader()
  249. fi = FileInput(files=['line1\nline2', 'line3\n'], openhook=src.openhook)
  250. self.assertEqual(src.linesread, [])
  251. self.assertEqual(fi.readline(), 'line1\n')
  252. self.assertEqual(src.linesread, ['line1\n'])
  253. self.assertEqual(fi.readline(), 'line2')
  254. self.assertEqual(src.linesread, ['line2'])
  255. self.assertEqual(fi.readline(), 'line3\n')
  256. self.assertEqual(src.linesread, ['', 'line3\n'])
  257. self.assertEqual(fi.readline(), '')
  258. self.assertEqual(src.linesread, [''])
  259. self.assertEqual(fi.readline(), '')
  260. self.assertEqual(src.linesread, [])
  261. fi.close()
  262. def test_iteration_buffering(self):
  263. src = LineReader()
  264. fi = FileInput(files=['line1\nline2', 'line3\n'], openhook=src.openhook)
  265. self.assertEqual(src.linesread, [])
  266. self.assertEqual(next(fi), 'line1\n')
  267. self.assertEqual(src.linesread, ['line1\n'])
  268. self.assertEqual(next(fi), 'line2')
  269. self.assertEqual(src.linesread, ['line2'])
  270. self.assertEqual(next(fi), 'line3\n')
  271. self.assertEqual(src.linesread, ['', 'line3\n'])
  272. self.assertRaises(StopIteration, next, fi)
  273. self.assertEqual(src.linesread, [''])
  274. self.assertRaises(StopIteration, next, fi)
  275. self.assertEqual(src.linesread, [])
  276. fi.close()
  277. class Test_hook_encoded(unittest.TestCase):
  278. """Unit tests for fileinput.hook_encoded()"""
  279. def test_modes(self):
  280. with open(TESTFN, 'wb') as f:
  281. # UTF-7 is a convenient, seldom used encoding
  282. f.write('A\nB\r\nC\rD+IKw-')
  283. self.addCleanup(safe_unlink, TESTFN)
  284. def check(mode, expected_lines):
  285. fi = FileInput(files=TESTFN, mode=mode,
  286. openhook=hook_encoded('utf-7'))
  287. lines = list(fi)
  288. fi.close()
  289. self.assertEqual(lines, expected_lines)
  290. check('r', [u'A\n', u'B\r\n', u'C\r', u'D\u20ac'])
  291. check('rU', [u'A\n', u'B\r\n', u'C\r', u'D\u20ac'])
  292. check('U', [u'A\n', u'B\r\n', u'C\r', u'D\u20ac'])
  293. check('rb', [u'A\n', u'B\r\n', u'C\r', u'D\u20ac'])
  294. def test_main():
  295. run_unittest(BufferSizesTests, FileInputTests, Test_hook_encoded)
  296. if __name__ == "__main__":
  297. test_main()