X-Git-Url: http://git.annexia.org/?a=blobdiff_plain;f=goaljobs.ml;h=b5981ad78a6988c9f7c701ac411512ea39ee5f4a;hb=90eaa31d3acea2c640d662323142776a3eab517c;hp=39c90071e796b0ea69b698dcdaebb34053366879;hpb=c4c582dad5435d404490f13acb5ddb706b020f07;p=goaljobs.git diff --git a/goaljobs.ml b/goaljobs.ml index 39c9007..b5981ad 100644 --- a/goaljobs.ml +++ b/goaljobs.ml @@ -16,6 +16,8 @@ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. *) +open CalendarLib + open Unix open Printf @@ -35,8 +37,122 @@ let target_all vs = target (List.fold_left (&&) true vs) let target_exists vs = target (List.fold_left (||) false vs) let require () = () +type period_t = Seconds | Days | Months | Years +let seconds = (1, Seconds) +let sec = seconds and secs = seconds and second = seconds +let minutes = (60, Seconds) +let min = minutes and mins = minutes and minute = minutes +let hours = (3600, Seconds) +let hour = hours +let days = (1, Days) +let day = days +let weeks = (7, Days) +let week = weeks +let months = (1, Months) +let month = months +let years = (1, Years) +let year = years + +let periodic_jobs = ref [] + +(* Register a periodic job. *) +let every ?name i (j, t) f = + let period = i*j, t in (* 5 minutes -> ((5 * 60), Seconds) *) + periodic_jobs := (period, (name, f)) :: !periodic_jobs + +(* [next_time t period] returns the earliest event of [period] + strictly after time [t]. + + Visualising periods as repeated events on a timeline, this + returns [t']: + + {v + events: ---+---------+---------+---------+---------+---------+----- + times: t t' + } + + Note that [period_t] events are not necessarily regular. + eg. The start of a month is not a fixed number of seconds + after the start of the previous month. 'Epoch' refers + to the Unix Epoch (ie. 1970-01-01 00:00:00 UTC). + + If [period = i, Seconds i] then events are when + [t' mod i == 0] when t' is the number of seconds since + the Epoch. This returns the next t' > t. 
+ + If [period = i, Days] then events happen at + midnight UTC every [i] days since the Epoch. + This returns the next midnight > t. + + If [period = i, Months] then events happen at + midnight UTC on the 1st day of the month every [i] months + since the Epoch. This returns midnight on the + 1st day of the next month > t. + + If [period = i, Years] then events happen at + midnight UTC on the 1st day of the year when + [(y - 1970) mod i == 0]. This returns midnight on the + 1st day of the next year > t. *) + +let next_time = + (* Round up 'a' to the next multiple of 'i'. *) + let round_up_float a i = + let r = mod_float a i in + if r = 0. then a +. i else a +. (i -. r) + and round_up a i = + let r = a mod i in + if r = 0 then a + i else a + (i - r) + in + + fun t -> function + | (i, Seconds) -> + let i = float_of_int i in + round_up_float t i + + | (i, Years) -> + let tm = gmtime t in + + (* Round 'tm' up to the first day of the next year. *) + let year = round_up tm.tm_year i in + let tm = { tm with tm_sec = 0; tm_min = 0; tm_hour = 0; + tm_mday = 1; tm_mon = 0; tm_year = year } in + fst (mktime tm) + + | (i, Days) -> + let t = Date.from_unixfloat t in + let t0 = Date.make 1970 1 1 in + + (* Number of whole days since Unix Epoch. *) + let nb_days = Date.Period.safe_nb_days (Date.sub t t0) in + + let nb_days = round_up nb_days i in + let t' = Date.add t0 (Date.Period.day nb_days) in + Date.to_unixfloat t' + + | (i, Months) -> + (* Calculate number of whole months since Unix Epoch. 
*) + let tm = gmtime t in + let months = 12 * (tm.tm_year - 70) + tm.tm_mon in + + let months = round_up months i in + let t0 = Date.make 1970 1 1 in + let t' = Date.add t0 (Date.Period.month months) in + Date.to_unixfloat t' + let file_exists = Sys.file_exists +let directory_exists path = + let s = + try Some (stat path) + with + | Unix_error (ENOENT, _, _) -> None + | Unix_error (err, _, _) -> + let msg = sprintf "directory_exists: %s: %s" path (error_message err) in + goal_failed msg in + match s with + | Some s -> s.st_kind = S_DIR + | None -> false + let file_newer_than f1 f2 = let stat f = try Some (stat f) @@ -195,13 +311,75 @@ let change_file_extension ext filename = val filter_file_extension : string -> string list -> string *) -(* XXX The Memory is not actually persistent yet. *) -let memory = Hashtbl.create 13 +(* Persistent memory is stored in $HOME/.goaljobs-memory. We have to + * lock this file each time we read or write because multiple concurrent + * jobs may access it at the same time. + * + * XXX Replace this with a more efficient and less fragile implementation. + *) + +type ('a, 'b) alternative = Either of 'a | Or of 'b +let with_memory_locked ?(write = false) f = + let filename = getenv "HOME" // ".goaljobs-memory" in + let fd = openfile filename [O_RDWR; O_CREAT] 0o644 in + lockf fd (if write then F_LOCK else F_RLOCK) 0; + (* If the file is newly created with zero size, write an + * empty hash table. + *) + if (fstat fd).st_size = 0 then ( + let empty : (string, string) Hashtbl.t = Hashtbl.create 13 in + let chan = out_channel_of_descr fd in + output_value chan empty; + Pervasives.flush chan; + ignore (lseek fd 0 SEEK_SET) + ); + + (* Run the function. 
*) + let r = try Either (f fd) with exn -> Or (exn) in + lockf fd F_ULOCK 0; + match r with + | Either x -> x + | Or exn -> raise exn + +let memory_exists key = + with_memory_locked ( + fun fd -> + let chan = in_channel_of_descr fd in + let memory : (string, string) Hashtbl.t = input_value chan in + Hashtbl.mem memory key + ) + +let memory_get key = + with_memory_locked ( + fun fd -> + let chan = in_channel_of_descr fd in + let memory : (string, string) Hashtbl.t = input_value chan in + try Some (Hashtbl.find memory key) with Not_found -> None + ) + +let memory_set key value = + with_memory_locked ~write:true ( + fun fd -> + let chan = in_channel_of_descr fd in + let memory : (string, string) Hashtbl.t = input_value chan in + Hashtbl.replace memory key value; + let chan = out_channel_of_descr fd in + seek_out chan 0; + output_value chan memory; + Pervasives.flush chan; + ) -let memory_exists = Hashtbl.mem memory -let memory_set = Hashtbl.replace memory -let memory_get k = try Some (Hashtbl.find memory k) with Not_found -> None -let memory_delete = Hashtbl.remove memory +let memory_delete key = + with_memory_locked ~write:true ( + fun fd -> + let chan = in_channel_of_descr fd in + let memory : (string, string) Hashtbl.t = input_value chan in + Hashtbl.remove memory key; + let chan = out_channel_of_descr fd in + seek_out chan 0; + output_value chan memory; + Pervasives.flush chan; + ) let published_goals = ref [] let publish name fn = published_goals := (name, fn) :: !published_goals @@ -213,6 +391,11 @@ let goal_file_exists filename = let msg = sprintf "file '%s' required but not found" filename in goal_failed msg ) +let goal_directory_exists path = + if not (directory_exists path) then ( + let msg = sprintf "directory '%s' required but not found" path in + goal_failed msg + ) let goal_file_newer_than f1 f2 = if not (file_newer_than f1 f2) then ( let msg = sprintf "file %s is required to be newer than %s" f1 f2 in @@ -245,8 +428,18 @@ let goal_memory_exists k = 
goal_failed msg ) +let guard fn arg = + try fn arg; true + with + | Goal_result (Goal_failed msg) -> + prerr_endline ("error: " ^ msg); + false + | exn -> + prerr_endline (Printexc.to_string exn); + false + (* Run the program. *) -let init () = +let rec init () = let prog = Sys.executable_name in let prog = Filename.basename prog in @@ -264,7 +457,8 @@ let init () = let names = !published_goals in let names = List.map fst names in let names = List.sort compare names in - List.iter print_endline names + List.iter print_endline names; + exit 0 in let argspec = Arg.align [ @@ -290,21 +484,65 @@ Options: let args = List.rev !args in (* Was a goal named on the command line? *) - match args with + (match args with | name :: args -> (match get_goal name with - | Some fn -> fn args + | Some fn -> + exit (if guard fn args then 0 else 1) | None -> eprintf "error: no goal called '%s' was found.\n" name; eprintf "Use %s -l to list all published goals in this script.\n" name; exit 1 ) | [] -> - (* Does a published 'all' goal exist? *) - match get_goal "all" with - | Some fn -> fn [] - | None -> - (* No published 'all' goal. This is only a warning, because - * other top-level code may exist in the script. - *) - eprintf "warning: no 'all' goal found.\n" + (* If periodic jobs exist, fall through. *) + if !periodic_jobs = [] then ( + (* Does a published 'all' goal exist? *) + match get_goal "all" with + | Some fn -> + exit (if guard fn [] then 0 else 1) + | None -> + (* No published 'all' goal. *) + eprintf "error: no goal called 'all' was found.\n"; + exit 1 + ) + ); + + assert (!periodic_jobs <> []); + + (* Run the periodic jobs. Note these run forever, or until killed. *) + while true do + (* Find the next job to run. *) + let now = time () in + let jobs = List.map ( + fun (period, (_, _ as name_f)) -> + next_time now period, name_f + ) !periodic_jobs in + let jobs = List.sort (fun (t1,_) (t2,_) -> compare t1 t2) jobs in + + (* Find all jobs that have the same next time. 
+ * XXX When we can handle parallel jobs we can do better here, + * but until then run all the ones which have the same time + * in series. + *) + let next_t = int_of_float (fst (List.hd jobs)) in + let jobs = List.filter (fun (t, _) -> int_of_float t = next_t) jobs in + + (* Run next job(s) after waiting for the appropriate amount of time. *) + let seconds = next_t - int_of_float now in + eprintf "next job will run in %s\n%!" (printable_seconds seconds); + sleep seconds; + + List.iter ( + fun (_, (name, f)) -> + eprintf "running job: %s\n%!" + (match name with Some name -> name | None -> "[unnamed]"); + ignore (guard f ()) + ) jobs + done + +and printable_seconds s = (* Render a duration of [s] seconds as human-readable text for the log; in the hours form the minutes field is the remainder after whole hours, not the total minutes. *) + if s < 60 then sprintf "%d seconds" s + else if s < 6000 then sprintf "%d minutes, %d seconds" (s/60) (s mod 60) + else if s < 86400 then sprintf "%d hours, %d minutes" (s/3600) ((s mod 3600)/60) + else sprintf "about %d days" (s/86400)