]> gitweb.michael.orlitzky.com - dead/htsn-import.git/blob - htsn-import.cabal
Add the initial implementation of TSN.XML.ScheduleChanges.
[dead/htsn-import.git] / htsn-import.cabal
1 name: htsn-import
2 version: 0.0.5
3 cabal-version: >= 1.8
4 author: Michael Orlitzky
5 maintainer: Michael Orlitzky <michael@orlitzky.com>
6 category: Utils
7 license: GPL-3
8 license-file: doc/LICENSE
9 build-type: Simple
10 extra-source-files:
11 doc/dbschema/*.png
12 doc/htsn-importrc.example
13 doc/man1/htsn-import.1
14 doc/README.development
15 doc/TODO
16 makefile
17 schema/*.dtd
18 schemagen/AutoRacingResultsXML/*.xml
19 schemagen/Auto_Racing_Schedule_XML/*.xml
20 schemagen/CBASK_3PPctXML/*.xml
21 schemagen/Cbask_All_Tourn_Teams_XML/*.xml
22 schemagen/CBASK_AssistsXML/*.xml
23 schemagen/Cbask_Awards_XML/*.xml
24 schemagen/CBASK_BlocksXML/*.xml
25 schemagen/Cbask_Conf_Standings_XML/*.xml
26 schemagen/Cbask_DivII_III_Indv_Stats_XML/*.xml
27 schemagen/Cbask_DivIII_Team_Stats_XML/*.xml
28 schemagen/Cbask_DivII_Team_Stats_XML/*.xml
29 schemagen/CBASK_FGPctXML/*.xml
30 schemagen/CBASK_FoulsXML/*.xml
31 schemagen/CBASK_FTPctXML/*.xml
32 schemagen/Cbask_Indv_Scoring_XML/*.xml
33 schemagen/CBASK_Lineup_XML/*.xml
34 schemagen/CBASK_MinutesXML/*.xml
35 schemagen/Cbask_Polls_XML/*.xml
36 schemagen/cbaskpreviewxml/*.xml
37 schemagen/CBASK_ReboundsXML/*.xml
38 schemagen/CBASK_ScoringLeadersXML/*.xml
39 schemagen/Cbask_Team_ThreePT_Made_XML/*.xml
40 schemagen/Cbask_Team_ThreePT_PCT_XML/*.xml
41 schemagen/Cbask_Team_Win_Pct_XML/*.xml
42 schemagen/CBASK_TopTwentyFiveResult_XML/*.xml
43 schemagen/Cbask_Top_Twenty_Five_XML/*.xml
44 schemagen/Cbask_Tourn_Awards_XML/*.xml
45 schemagen/Cbask_Tourn_Champs_XML/*.xml
46 schemagen/Cbask_Tourn_Indiv_XML/*.xml
47 schemagen/Cbask_Tourn_Leaders_XML/*.xml
48 schemagen/Cbask_Tourn_MVP_XML/*.xml
49 schemagen/Cbask_Tourn_Records_XML/*.xml
50 schemagen/cflpreviewxml/*.xml
51 schemagen/Heartbeat/*.xml
52 schemagen/Injuries_Detail_XML/*.xml
53 schemagen/injuriesxml/*.xml
54 schemagen/jfilexml/*.xml
55 schemagen/LeagueScheduleXML/*.xml
56 schemagen/Matchup_NBA_NHL_XML/*.xml
57 schemagen/Minor_Baseball_League_Leaders_XML/*.xml
58 schemagen/Minor_Baseball_Standings_XML/*.xml
59 schemagen/Minor_Baseball_Transactions_XML/*.xml
60 schemagen/minorscoresxml/*.xml
61 schemagen/mlbbattingavgxml/*.xml
62 schemagen/mlbdoublesleadersxml/*.xml
63 schemagen/MLB_ERA_Leaders/*.xml
64 schemagen/MLB_Fielding_XML/*.xml
65 schemagen/MLBGamesPlayedXML/*.xml
66 schemagen/MLB_Gaming_Matchup_XML/*.xml
67 schemagen/MLBGIDPXML/*.xml
68 schemagen/MLBHitByPitchXML/*.xml
69 schemagen/mlbhitsleadersxml/*.xml
70 schemagen/mlbhomerunsxml/*.xml
71 schemagen/MLBHRFreqXML/*.xml
72 schemagen/MLBIntWalksXML/*.xml
73 schemagen/MLBKORateXML/*.xml
74 schemagen/MLB_Lineup_XML/*.xml
75 schemagen/MLB_Matchup_XML/*.xml
76 schemagen/mlbonbasepctxml/*.xml
77 schemagen/MLBOPSXML/*.xml
78 schemagen/MLB_Pitching_Appearances_Leaders/*.xml
79 schemagen/MLB_Pitching_Balks_Leaders/*.xml
80 schemagen/MLB_Pitching_CG_Leaders/*.xml
81 schemagen/MLB_Pitching_ER_Allowed_Leaders/*.xml
82 schemagen/MLB_Pitching_Hit_Batters_Leaders/*.xml
83 schemagen/MLB_Pitching_Hits_Allowed_Leaders/*.xml
84 schemagen/MLB_Pitching_HR_Allowed_Leaders/*.xml
85 schemagen/MLB_Pitching_IP_Leaders/*.xml
86 schemagen/MLB_Pitching_Runs_Allowed_Leaders/*.xml
87 schemagen/MLB_Pitching_Saves_Leaders/*.xml
88 schemagen/MLB_Pitching_Shut_Outs_Leaders/*.xml
89 schemagen/MLB_Pitching_Starts_Leaders/*.xml
90 schemagen/MLB_Pitching_Strike_Outs_Leaders/*.xml
91 schemagen/MLB_Pitching_Walks_Leaders/*.xml
92 schemagen/MLB_Pitching_WHIP_Leaders/*.xml
93 schemagen/MLB_Pitching_Wild_Pitches_Leaders/*.xml
94 schemagen/MLB_Pitching_Win_Percentage_Leaders/*.xml
95 schemagen/MLB_Pitching_WL_Leaders/*.xml
96 schemagen/MLBPlateAppsXML/*.xml
97 schemagen/mlbpreviewxml/*.xml
98 schemagen/mlbrbisxml/*.xml
99 schemagen/mlbrunsleadersxml/*.xml
100 schemagen/MLBSacFliesXML/*.xml
101 schemagen/MLBSacrificesXML/*.xml
102 schemagen/MLBSBSuccessXML/*.xml
103 schemagen/mlbsluggingpctxml/*.xml
104 schemagen/mlbstandxml/*.xml
105 schemagen/mlbstandxml_preseason/*.xml
106 schemagen/mlbstolenbasexml/*.xml
107 schemagen/mlbtotalbasesleadersxml/*.xml
108 schemagen/mlbtriplesleadersxml/*.xml
109 schemagen/MLBWalkRateXML/*.xml
110 schemagen/mlbwalksleadersxml/*.xml
111 schemagen/MLBXtraBaseHitsXML/*.xml
112 schemagen/MLS_Preview_XML/*.xml
113 schemagen/NBA3PPctXML/*.xml
114 schemagen/NBAAssistsXML/*.xml
115 schemagen/NBABlocksXML/*.xml
116 schemagen/nbaconfrecxml/*.xml
117 schemagen/nbadaysxml/*.xml
118 schemagen/nbadivisionsxml/*.xml
119 schemagen/NBAFGPctXML/*.xml
120 schemagen/NBAFoulsXML/*.xml
121 schemagen/NBAFTPctXML/*.xml
122 schemagen/NBA_Gaming_Matchup_XML/*.xml
123 schemagen/NBALineupXML/*.xml
124 schemagen/NBAMinutesXML/*.xml
125 schemagen/NBA_Playoff_Matchup_XML/*.xml
126 schemagen/nbapreviewxml/*.xml
127 schemagen/NBAReboundsXML/*.xml
128 schemagen/NBAScorersXML/*.xml
129 schemagen/nbastandxml/*.xml
130 schemagen/NBAStealsXML/*.xml
131 schemagen/nbateamleadersxml/*.xml
132 schemagen/NBA_Team_Stats_XML/*.xml
133 schemagen/nbatripledoublexml/*.xml
134 schemagen/NBATurnoversXML/*.xml
135 schemagen/NCAA_Conference_Schedule_XML/*.xml
136 schemagen/NCAA_FB_Preview_XML/*.xml
137 schemagen/newsxml/*.xml
138 schemagen/nflfirstdownxml/*.xml
139 schemagen/NFLFumbleLeaderXML/*.xml
140 schemagen/NFLGiveTakeXML/*.xml
141 schemagen/NFLInside20XML/*.xml
142 schemagen/NFL_KickingLeaders_XML/*.xml
143 schemagen/NFLKickoffsXML/*.xml
144 schemagen/NFLMondayNightXML/*.xml
145 schemagen/NFL_NBA_Draft_XML/*.xml
146 schemagen/NFL_NCAA_FB_Matchup_XML/*.xml
147 schemagen/NFLPassLeadXML/*.xml
148 schemagen/nflpreviewxml/*.xml
149 schemagen/NFLQBStartsXML/*.xml
150 schemagen/NFL_Roster_XML/*.xml
151 schemagen/NFLSackLeadersXML/*.xml
152 schemagen/nflstandxml/*.xml
153 schemagen/NFLTeamRankingsXML/*.xml
154 schemagen/NFL_Team_Stats_XML/*.xml
155 schemagen/NFLTopPerformanceXML/*.xml
156 schemagen/NFLTotalYardageXML/*.xml
157 schemagen/nhlpreviewxml/*.xml
158 schemagen/Odds_XML/*.xml
159 schemagen/recapxml/*.xml
160 schemagen/Schedule_Changes_XML/*.xml
161 schemagen/scoresxml/*.xml
162 schemagen/Transactions_XML/*.xml
163 schemagen/weatherxml/*.xml
164 schemagen/Weekly_Sched_XML/*.xml
165 schemagen/WNBA3PPctXML/*.xml
166 schemagen/WNBAAssistsXML/*.xml
167 schemagen/WNBABlocksXML/*.xml
168 schemagen/WNBAFGPctXML/*.xml
169 schemagen/WNBAFoulsXML/*.xml
170 schemagen/WNBAFTPctXML/*.xml
171 schemagen/WNBAMinutesXML/*.xml
172 schemagen/WNBAReboundsXML/*.xml
173 schemagen/WNBAScorersXML/*.xml
174 schemagen/wnbastandxml/*.xml
175 schemagen/WNBAStealsXML/*.xml
176 schemagen/WNBA_Team_Leaders_XML/*.xml
177 schemagen/WNBATurnoversXML/*.xml
178 schemagen/WorldBaseballPreviewXML/*.xml
179 test/shell/*.test
180 test/xml/*.xml
181 test/xml/*.dtd
182 synopsis:
183 Import XML files from The Sports Network into an RDBMS.
184 description:
185 /Usage/:
186 .
187 @
188 htsn-import [OPTIONS] [FILES]
189 @
190 .
191 The Sports Network <http://www.sportsnetwork.com/> offers an XML feed
192 containing various sports news and statistics. Our sister program
193 /htsn/ is capable of retrieving the feed and saving the individual
194 XML documents contained therein. But what to do with them?
195 .
196 The purpose of /htsn-import/ is to take these XML documents and
197 get them into something we can use, a relational database management
198 system (RDBMS), loosely known as a SQL database. The structure of a
199 relational database is, well, relational, and the feed XML is not. So
200 there is some work to do before the data can be inserted.
201 .
202 First, we must parse the XML. Each supported document type (see below)
203 has a full pickle/unpickle implementation (\"pickle\" is simply a
204 synonym for serialize here). That means that we parse the entire
205 document into a data structure, and if we pickle (serialize) that data
206 structure, we get the exact same XML document that we started with.
207 .
208 This is important for two reasons. First, it serves as a second level
209 of validation. The first validation is performed by the XML parser,
210 but if that succeeds and unpickling fails, we know that something is
211 fishy. Second, we don't ever want to be surprised by some new element
212 or attribute showing up in the XML. The fact that we can unpickle the
213 whole thing now means that we won't be surprised in the future.
214 .
215 The aforementioned feature is especially important because we
216 automatically migrate the database schema every time we import a
217 document. If you attempt to import a \"newsxml.dtd\" document, all
218 database objects relating to the news will be created if they do not
219 exist. We don't want the schema to change out from under us without
220 warning, so it's important that no XML be parsed that would result in
221 a different schema than we had previously. Since we can
222 pickle/unpickle everything already, this should be impossible.
223 .
224 Examples and usage documentation are available in the man page.
225
226 executable htsn-import
227 build-depends:
228 base >= 4.6 && < 5,
229 cmdargs >= 0.10.6,
230 configurator >= 0.2,
231 directory >= 1.2,
232 filepath >= 1.3,
233 hslogger >= 1.2,
234 htsn-common >= 0.0.1,
235 hxt >= 9.3,
236 groundhog >= 0.5,
237 groundhog-postgresql >= 0.5,
238 groundhog-sqlite >= 0.5,
239 groundhog-th >= 0.5,
240 MissingH >= 1.2,
241 old-locale >= 1,
242 split >= 0.2,
243 tasty >= 0.8,
244 tasty-hunit >= 0.8,
245 time >= 1.4,
246 transformers >= 0.3,
247 tuple >= 0.2
248
249 main-is:
250 Main.hs
251
252 hs-source-dirs:
253 src/
254
255 other-modules:
256 Backend
257 CommandLine
258 Configuration
259 ConnectionString
260 ExitCodes
261 OptionalConfiguration
262 TSN.Codegen
263 TSN.Database
264 TSN.DbImport
265 TSN.Parse
266 TSN.Picklers
267 TSN.Team
268 TSN.XmlImport
269 TSN.XML.AutoRacingResults
270 TSN.XML.AutoRacingSchedule
271 TSN.XML.GameInfo
272 TSN.XML.Heartbeat
273 TSN.XML.Injuries
274 TSN.XML.InjuriesDetail
275 TSN.XML.JFile
276 TSN.XML.News
277 TSN.XML.Odds
278 TSN.XML.ScheduleChanges
279 TSN.XML.Scores
280 TSN.XML.SportInfo
281 TSN.XML.Weather
282 Xml
283
284 ghc-options:
285 -Wall
286 -fwarn-hi-shadowing
287 -fwarn-missing-signatures
288 -fwarn-name-shadowing
289 -fwarn-orphans
290 -fwarn-type-defaults
291 -fwarn-tabs
292 -fwarn-incomplete-record-updates
293 -fwarn-monomorphism-restriction
294 -fwarn-unused-do-bind
295 -O2
296
297 ghc-prof-options:
298 -prof
299 -fprof-auto
300 -fprof-cafs
301 -- The following unbreak profiling with Template Haskell. We have
302 -- to build the program twice; once without profiling and again with
303 -- these flags.
304 -hisuf hi_p
305 -osuf o_p
306
307
308 test-suite testsuite
309 type: exitcode-stdio-1.0
310 hs-source-dirs: src test
311 main-is: TestSuite.hs
312 build-depends:
313 base >= 4.6 && < 5,
314 cmdargs >= 0.10.6,
315 configurator >= 0.2,
316 directory >= 1.2,
317 filepath >= 1.3,
318 hslogger >= 1.2,
319 htsn-common >= 0.0.1,
320 hxt >= 9.3,
321 groundhog >= 0.5,
322 groundhog-postgresql >= 0.5,
323 groundhog-sqlite >= 0.5,
324 groundhog-th >= 0.5,
325 MissingH >= 1.2,
326 old-locale >= 1,
327 split >= 0.2,
328 tasty >= 0.8,
329 tasty-hunit >= 0.8,
330 time >= 1.4,
331 transformers >= 0.3,
332 tuple >= 0.2
333
334 -- It's not entirely clear to me why I have to reproduce all of this.
335 ghc-options:
336 -Wall
337 -fwarn-hi-shadowing
338 -fwarn-missing-signatures
339 -fwarn-name-shadowing
340 -fwarn-orphans
341 -fwarn-type-defaults
342 -fwarn-tabs
343 -fwarn-incomplete-record-updates
344 -fwarn-monomorphism-restriction
345 -fwarn-unused-do-bind
346 -O2
347
348
349 test-suite doctests
350 type: exitcode-stdio-1.0
351 hs-source-dirs: test
352 main-is: Doctests.hs
353 build-depends:
354 base >= 4.6 && < 5,
355 -- Additional test dependencies.
356 doctest >= 0.9
357
358 -- It's not entirely clear to me why I have to reproduce all of this.
359 ghc-options:
360 -Wall
361 -fwarn-hi-shadowing
362 -fwarn-missing-signatures
363 -fwarn-name-shadowing
364 -fwarn-orphans
365 -fwarn-type-defaults
366 -fwarn-tabs
367 -fwarn-incomplete-record-updates
368 -fwarn-monomorphism-restriction
369 -fwarn-unused-do-bind
370 -rtsopts
371 -threaded
372 -optc-O3
373 -optc-march=native
374 -O2
375
376
377 -- These won't work without shelltestrunner installed in your
378 -- $PATH. Maybe there is some way to tell Cabal that.
379 test-suite shelltests
380 type: exitcode-stdio-1.0
381 hs-source-dirs: test
382 main-is: ShellTests.hs
383
384 build-depends:
385 base >= 4.6 && < 5,
386 cmdargs >= 0.10.6,
387 configurator >= 0.2,
388 directory >= 1.2,
389 filepath >= 1.3,
390 hslogger >= 1.2,
391 htsn-common >= 0.0.1,
392 hxt >= 9.3,
393 groundhog >= 0.5,
394 groundhog-postgresql >= 0.5,
395 groundhog-sqlite >= 0.5,
396 groundhog-th >= 0.5,
397 MissingH >= 1.2,
398 old-locale >= 1,
399 split >= 0.2,
400 process >= 1.1,
401 tasty >= 0.8,
402 tasty-hunit >= 0.8,
403 time >= 1.4,
404 transformers >= 0.3,
405 tuple >= 0.2
406
407
408
409 source-repository head
410 type: git
411 location: http://michael.orlitzky.com/git/htsn-import.git
412 branch: master