-- | (Un)picklers for the date, time, and earnings text formats that
--   appear in TSN XML.
--
module TSN.Picklers (
  xp_date,
  xp_date_padded,
  xp_earnings,
  xp_gamedate,
  xp_racedate,
  xp_tba_time,
  xp_time,
  xp_time_stamp )
where

-- System imports.
import Data.String.Utils ( replace )
import Data.Time.Clock ( NominalDiffTime, UTCTime, addUTCTime )
import Data.Time.Format ( formatTime, parseTime )
import System.Locale ( defaultTimeLocale )
import Text.Read ( readMaybe )
import Text.XML.HXT.Arrow.Pickle (
  xpText,
  xpWrap,
  xpWrapMaybe )
import Text.XML.HXT.Arrow.Pickle.Xml ( PU )

-- Local imports.
import TSN.Parse (
  parse_time_stamp,
  time_format,
  time_stamp_format )


-- | The format string for a base date in m/d/yyyy format. The
--   day/month are not padded at all. This will match for example,
--
--   * 2/15/1983
--   * 1/1/0000
--
date_format :: String
date_format = "%-m/%-d/%Y"


-- | The format string for a base date in mm/dd/yyyy format. The
--   day/month are padded to two characters with zeros. This will
--   match for example,
--
--   * 02/15/1983
--   * 01/01/0000
--
date_format_padded :: String
date_format_padded = "%0m/%0d/%Y"


-- | (Un)pickle a 'UTCTime' without the time portion. The text is
--   parsed and rendered with 'date_format', so the day and month are
--   not padded. Unpickling fails if the text does not parse.
--
xp_date :: PU UTCTime
xp_date =
  (to_date, from_date) `xpWrapMaybe` xpText
  where
    to_date :: String -> Maybe UTCTime
    to_date = parseTime defaultTimeLocale date_format

    from_date :: UTCTime -> String
    from_date = formatTime defaultTimeLocale date_format


-- | (Un)pickle a 'UTCTime' without the time portion. The day/month
--   are padded to two characters with zeros (see
--   'date_format_padded'). Unpickling fails if the text does not
--   parse.
--
xp_date_padded :: PU UTCTime
xp_date_padded =
  (to_date, from_date) `xpWrapMaybe` xpText
  where
    to_date :: String -> Maybe UTCTime
    to_date = parseTime defaultTimeLocale date_format_padded

    from_date :: UTCTime -> String
    from_date = formatTime defaultTimeLocale date_format_padded


-- | (Un)pickle the earnings text from an 'AutoRaceResultsListing'.
--   These are essentially 'Int's, but they look like,
--
--   * 336,826
--   * 1,000,191
--   * TBA
--
--   The string \"TBA\", and any other text that is not an integer
--   once its commas are removed, unpickles to 'Nothing'. When
--   pickling, 'Nothing' becomes the empty string and a 'Just' value
--   is written with 'show', that is, without thousands separators.
--
xp_earnings :: PU (Maybe Int)
xp_earnings =
  (to_earnings, from_earnings) `xpWrap` xpText
  where
    strip_commas :: String -> String
    strip_commas = replace "," ""

    -- Use 'readMaybe' on the raw digits. Calling 'show' on the input
    -- first would wrap it in quotes, and 'read' at type @Maybe Int@
    -- expects the syntax @Just 1@, so that combination can never
    -- parse a bare number and throws at runtime instead.
    to_earnings :: String -> Maybe Int
    to_earnings s
      | s == "TBA" = Nothing
      | otherwise = readMaybe (strip_commas s)

    from_earnings :: Maybe Int -> String
    from_earnings Nothing = ""
    from_earnings (Just i) = show i


-- | (Un)pickle a 'UTCTime' from the race date text in an
--   'AutoRaceResults' message. The text is a 'date_format' date, a
--   space, and then a twelve-hour time with seconds and an AM/PM
--   marker.
--
--   Examples:
--
--   * 6/1/2014 1:00:00 PM
--   * 5/24/2014 2:45:00 PM
--
xp_racedate :: PU UTCTime
xp_racedate =
  (to_racedate, from_racedate) `xpWrapMaybe` xpText
  where
    format :: String
    format = date_format ++ " " ++ "%-I:%M:%S %p"

    to_racedate :: String -> Maybe UTCTime
    to_racedate = parseTime defaultTimeLocale format

    from_racedate :: UTCTime -> String
    from_racedate = formatTime defaultTimeLocale format


-- | (Un)pickle a 'UTCTime' from a weather forecast's gamedate. The
--   text is a weekday name, a month name, and an unpadded day of the
--   month followed by an English ordinal suffix; for example
--   \"Monday, December 30th\".
--
--   When unpickling we get rid of the suffixes \"st\", \"nd\",
--   \"rd\", and \"th\". During pickling, we add them back based on
--   the day of the month.
--
xp_gamedate :: PU UTCTime
xp_gamedate =
  (to_gamedate, from_gamedate) `xpWrapMaybe` xpText
  where
    format :: String
    format = "%A, %B %-d"

    to_gamedate :: String -> Maybe UTCTime
    to_gamedate = parseTime defaultTimeLocale format . strip_suffix

    -- Drop a trailing two-letter ordinal suffix, if there is one.
    -- Strings that are too short, or that end in something else, are
    -- left alone.
    strip_suffix :: String -> String
    strip_suffix s =
      case reverse s of
        (c2:c1:cs)
          | [c1,c2] `elem` ["st", "nd", "rd", "th"] -> reverse cs
        _ -> s

    from_gamedate :: UTCTime -> String
    from_gamedate d = s ++ ordinal_suffix s
      where
        s = formatTime defaultTimeLocale format d

    -- Choose the suffix from the trailing digits of the formatted
    -- date. The tens digit has to be checked first: 11, 12, and 13
    -- take \"th\" even though they end in 1, 2, and 3.
    ordinal_suffix :: String -> String
    ordinal_suffix cs =
      case reverse cs of
        []        -> []
        (_:'1':_) -> "th" -- 10 through 19.
        ('1':_)   -> "st"
        ('2':_)   -> "nd"
        ('3':_)   -> "rd"
        _         -> "th"


-- | (Un)pickle a 'UTCTime' without the date portion, using
--   'time_format' from "TSN.Parse". Unpickling fails if the text
--   does not parse.
--
xp_time :: PU UTCTime
xp_time =
  (to_time, from_time) `xpWrapMaybe` xpText
  where
    to_time :: String -> Maybe UTCTime
    to_time = parseTime defaultTimeLocale time_format

    from_time :: UTCTime -> String
    from_time = formatTime defaultTimeLocale time_format


-- | (Un)pickle a 'UTCTime' without the date portion, allowing for a
--   value of \"TBA\" (which gets translated to 'Nothing'). Text that
--   does not parse with 'time_format' also becomes 'Nothing' rather
--   than failing the unpickle. When pickling, 'Nothing' is written
--   as the empty string.
--
xp_tba_time :: PU (Maybe UTCTime)
xp_tba_time =
  (to_time, from_time) `xpWrap` xpText
  where
    to_time :: String -> Maybe UTCTime
    to_time s
      | s == "TBA" = Nothing
      | otherwise = parseTime defaultTimeLocale time_format s

    from_time :: Maybe UTCTime -> String
    from_time = maybe "" (formatTime defaultTimeLocale time_format)


-- | (Un)pickle the time stamp text format to/from a 'UTCTime'.
--
--   Example: January 6, 2014, at 10:11 PM ET
--
--   TSN doesn't provide a proper time zone name, so we assume that
--   it's always Eastern Standard Time. EST is UTC-5, so we subtract
--   five hours from the UTC value before formatting it. Parsing is
--   delegated to 'parse_time_stamp', which presumably applies the
--   opposite shift (it is defined in "TSN.Parse"; confirm there).
--
xp_time_stamp :: PU UTCTime
xp_time_stamp =
  (parse_time_stamp, from_time_stamp) `xpWrapMaybe` xpText
  where
    five_hours :: NominalDiffTime
    five_hours = 5 * 60 * 60

    subtract_five :: UTCTime -> UTCTime
    subtract_five = addUTCTime (negate five_hours)

    from_time_stamp :: UTCTime -> String
    from_time_stamp =
      formatTime defaultTimeLocale time_stamp_format . subtract_five