infochimps / imw

Infinite Monkeywrench - A framework for collecting, peeling, and sharing delicious bananas of data.

commit  57f7273dcd930bd6e1a4c6c287af5b5c2fdbaf77
tree    72adaeec4d181324bde111e662a1657652a62970
parent  737e3d1e7530d5d867f0e4be7f6855c89ee6ab0c
imw / Manifest
100644 173 lines (172 sloc) 4.973 kb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
CHANGELOG
Manifest
README-commands
README-license
README-organization.txt
README-overview
README.rdoc
Rakefile
TAGS
TODO
TODO-scraper.TODO
etc/directories.yaml
etc/icss/metadata-rights.icss.yaml
etc/icss/skel.icss.yaml
etc/imwrc.rb
etc/taxonomy.yaml
imw.org
lib/imw.rb
lib/imw/boot.rb
lib/imw/chunk_store/cached_uri.rb
lib/imw/chunk_store/chunk.rb
lib/imw/chunk_store/scrape.rb
lib/imw/chunk_store/scrape_request.rb
lib/imw/chunk_store/tracker.rb
lib/imw/chunk_store/uri_file_store.rb
lib/imw/chunk_store/uri_file_store_junk.rb
lib/imw/dataset.rb
lib/imw/dataset/datamapper.rb
lib/imw/dataset/datamapper/time_and_user_stamps.rb
lib/imw/dataset/loaddump.rb
lib/imw/dataset/old/file_collection.rb
lib/imw/dataset/old/file_collection_utils.rb
lib/imw/dataset/scaffold.rb
lib/imw/dataset/scraped_uri.rb
lib/imw/dataset/scrub/old_working_scrubber.rb
lib/imw/dataset/scrub/scrub.rb
lib/imw/dataset/scrub/scrub_simple_url.rb
lib/imw/dataset/scrub/scrub_test.rb
lib/imw/dataset/scrub/slug.rb
lib/imw/dataset/stats.rb
lib/imw/dataset/stats/counter.rb
lib/imw/dataset/task.rb
lib/imw/dataset/workflow.rb
lib/imw/extract/flat_file_parser.rb
lib/imw/extract/hpricot.rb
lib/imw/extract/html_parser/match_tree.rb
lib/imw/extract/html_parser/matcher.rb
lib/imw/extract/loaddump.rb
lib/imw/files.rb
lib/imw/files/archive.rb
lib/imw/files/basicfile.rb
lib/imw/files/binary.rb
lib/imw/files/compressed_file.rb
lib/imw/files/compressed_files_and_archives.rb
lib/imw/files/compressible.rb
lib/imw/files/csv.rb
lib/imw/files/json.rb
lib/imw/files/sgml.rb
lib/imw/files/text.rb
lib/imw/files/yaml.rb
lib/imw/infochimps/ics-rails-datamapper-migration-maker.rb
lib/imw/infochimps/ics-wreck_and_migrate.rb
lib/imw/infochimps/ics_models_more.rb
lib/imw/infochimps/icss.rb
lib/imw/infochimps/infochimps_models.rb
lib/imw/infochimps/infochimps_resource.rb
lib/imw/infochimps/link.rb
lib/imw/infochimps/metadataset.rb
lib/imw/model/source.rb
lib/imw/package.rb
lib/imw/package/to_archive.rb
lib/imw/parsers.rb
lib/imw/parsers/flat_file_parser.rb
lib/imw/parsers/html_parser.rb
lib/imw/parsers/html_parser/matchers.rb
lib/imw/parsers/line_parser.rb
lib/imw/pool.rb
lib/imw/reconcile.rb
lib/imw/reconcile/canonicalize_by_mapping.rb
lib/imw/rip.rb
lib/imw/rip/database.rb
lib/imw/rip/feed.rb
lib/imw/rip/http.rb
lib/imw/rip/local.rb
lib/imw/transform.rb
lib/imw/utils.rb
lib/imw/utils/archive.rb
lib/imw/utils/components.rb
lib/imw/utils/config.rb
lib/imw/utils/error.rb
lib/imw/utils/extensions/array.rb
lib/imw/utils/extensions/class/attribute_accessors.rb
lib/imw/utils/extensions/core.rb
lib/imw/utils/extensions/dir.rb
lib/imw/utils/extensions/file_core.rb
lib/imw/utils/extensions/fileutils.rb
lib/imw/utils/extensions/find.rb
lib/imw/utils/extensions/hash.rb
lib/imw/utils/extensions/hpricot.rb
lib/imw/utils/extensions/string.rb
lib/imw/utils/extensions/struct.rb
lib/imw/utils/extensions/symbol.rb
lib/imw/utils/extensions/typed_struct.rb
lib/imw/utils/extensions/uri.rb
lib/imw/utils/log.rb
lib/imw/utils/misc.rb
lib/imw/utils/paths.rb
lib/imw/utils/uri.rb
lib/imw/utils/uuid.rb
lib/imw/utils/validate.rb
lib/imw/utils/version.rb
lib/imw/utils/view.rb
lib/imw/utils/view/dump_csv.rb
lib/imw/utils/view/dump_csv_older.rb
lib/tasks/boot.rb
lib/tasks/db.rake
lib/tasks/dev/devutils.rake
lib/tasks/dev/makegem.rake
lib/tasks/dump.rake
lib/tasks/load.rake
lib/tasks/main.rake
lib/tasks/munge.rake
lib/tasks/munge/lint.rake
lib/tasks/paths.rake
lib/tasks/pkg.rake
lib/tasks/pool.rake
lib/tasks/prep.rake
lib/tasks/rip.rake
meta/design/bs/principles.txt
meta/design/notes/about_textile.txt
meta/design/notes/about_w3schema_dublincore.txt
meta/design/notes/about_w3schema_fiddle.txt
meta/design/schema_format.txt
meta/model/imw_struct.rb
meta/model/schemadb_schema.rb
meta/model/tag_list.rb
meta/notes/about-rdoc.txt
old/spec/imw/rip_test.rb
old/spec/imw/utils/validate_test.rb
old/spec/rspec_autotest.rb
spec/imw/#files_spec.rb#
spec/imw/dataset/datamapper/uri_spec.rb
spec/imw/dataset/datamapper_spec_helper.rb
spec/imw/files/samples/sample.csv
spec/imw/files/samples/sample.tsv
spec/imw/files/samples/sample.xml
spec/imw/files/samples/sample.yaml
spec/imw/files_spec.rb
spec/imw/matchers/archive_contents_matcher.rb
spec/imw/matchers/directory_contents_matcher.rb
spec/imw/matchers/file_contents_matcher.rb
spec/imw/matchers/without_regard_to_order_matcher.rb
spec/imw/model/directory_spec.rb
spec/imw/model/files/archive_spec.rb
spec/imw/model/files/bz2_spec.rb
spec/imw/model/files/compressed_file_spec.rb
spec/imw/model/files/compressible_spec.rb
spec/imw/model/files/file_spec.rb
spec/imw/model/files/gz_spec.rb
spec/imw/model/files/rar_spec.rb
spec/imw/model/files/tar_spec.rb
spec/imw/model/files/text_spec.rb
spec/imw/model/files/zip_spec.rb
spec/imw/utils/extensions/file_core_spec.rb
spec/imw/utils/extensions/find_spec.rb
spec/imw/utils/paths_spec.rb
spec/imw/workflow/rip/local_spec.rb
spec/imw/workflow/rip_spec.rb
spec/rcov.opts
spec/spec.opts
spec/spec_helper.rb
spec/support/random.rb