-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtsv.py
112 lines (81 loc) · 3.09 KB
/
tsv.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
#!/usr/bin/env python2.7
# tsv.py: a module for reading and writing TSV (tab-separated value) files
"""
This module defines two classes: a TsvWriter, which can be constructed on a
stream to allow writing TSV data lines and #-delimited comments to that stream,
and a TsvReader, which can be constructed on a stream and iterated over to
obtain lists of the values from each non-comment line in the stream.
TSV is most useful as the basis for other, more tightly specified file formats.
Examples of how to use this module are available here:
https://github.com/adamnovak/tsv/blob/master/README.md
"""
class TsvWriter(object):
    """
    Represents a writer for tab-separated value files containing #-delimited
    comments.

    The writer does no escaping: each value is passed through str() and
    written as-is, so values must not themselves contain tabs or newlines.
    """

    def __init__(self, stream):
        """
        Make a new TsvWriter for writing TSV data to the given stream.

        stream is any object with write() and close() methods that accepts
        str data.
        """
        # This holds the stream
        self.stream = stream

    def line(self, *args):
        """
        Write the given values to the file, as a TSV line. Args holds a list of
        all arguments passed. Any argument that stringifies to a string legal as
        a TSV data item can be written.

        Calling with no arguments writes nothing.
        """
        self.list_line(args)

    def list_line(self, line):
        """
        Write the given iterable of values (line) to the file as items on the
        same line. Any argument that stringifies to a string legal as a TSV data
        item can be written.

        Accepts any iterable, including generators and other one-shot
        iterators. An empty iterable writes nothing (not even a newline).

        Does not copy the line or build a big string in memory.
        """
        # Walk the iterable exactly once through the iterator protocol, so
        # that len(), indexing and slicing (which copies) are never required.
        items = iter(line)

        try:
            first = next(items)
        except StopIteration:
            # Nothing to write for an empty line.
            return

        write = self.stream.write
        write(str(first))
        for item in items:
            # Every item after the first is preceded by a tab separator.
            write("\t")
            write(str(item))
        write("\n")

    def comment(self, text):
        """
        Write the given text as a TSV comment. text must be a string containing
        no newlines.

        The comment is written as "# " followed by the text and a newline.
        """
        self.stream.write("# {}\n".format(text))

    def close(self):
        """
        Close the underlying stream.
        """
        self.stream.close()
class TsvReader(object):
    """
    Represents a reader for tab-separated value files. Skips over comments
    starting with #. Can be iterated over.

    Field values consisting of only whitespace are not allowed: each line is
    stripped of surrounding whitespace (tabs included) before it is split, so
    empty leading or trailing fields are lost.
    """

    def __init__(self, stream):
        """
        Make a new TsvReader to read from the given stream.

        stream is any object that yields text lines when iterated and has a
        close() method.
        """
        self.stream = stream

    def __iter__(self):
        """
        Yields lists of all fields on each line, as strings, until all lines are
        exhausted. Strips whitespace around field contents.

        Blank lines and lines whose first non-whitespace character is # are
        skipped.
        """
        for raw_line in self.stream:
            line = raw_line.strip()

            if not line or line.startswith("#"):
                # Skip comments and empty lines
                continue

            # Build a real list (map() is lazy on Python 3) and call strip()
            # on each field itself, so that unicode fields on Python 2 work
            # just as well as plain str fields.
            yield [field.strip() for field in line.split("\t")]

    def close(self):
        """
        Close the underlying stream.
        """
        self.stream.close()