···
+
last_river_post_date: float option; (** Timestamp of last River post for this user *)
(** Parse a user registration from JSON-like string format *)
let user_registration_of_string s : user_registration option =
+
(* Format: "email|zulip_id|full_name|timestamp|is_admin|last_river_post_date" *)
match String.split_on_char '|' s with
+
| [email; zulip_id_str; full_name; timestamp_str; is_admin_str; last_river_str] ->
+
let last_river_post_date =
+
if last_river_str = "" || last_river_str = "none" then None
+
else Some (float_of_string last_river_str)
+
zulip_id = int_of_string zulip_id_str;
+
registered_at = float_of_string timestamp_str;
+
is_admin = bool_of_string is_admin_str;
| [email; zulip_id_str; full_name; timestamp_str; is_admin_str] ->
+
(* Backward compatibility - old format without last_river_post_date *)
zulip_id = int_of_string zulip_id_str;
registered_at = float_of_string timestamp_str;
is_admin = bool_of_string is_admin_str;
+
last_river_post_date = None;
| [email; zulip_id_str; full_name; timestamp_str] ->
+
(* Backward compatibility - old format without is_admin and last_river_post_date *)
zulip_id = int_of_string zulip_id_str;
registered_at = float_of_string timestamp_str;
+
last_river_post_date = None;
(** Convert a user registration to string format *)
let user_registration_to_string (reg : user_registration) : string =
+
let last_river_str = match reg.last_river_post_date with
+
| Some t -> string_of_float t
+
Printf.sprintf "%s|%d|%s|%f|%b|%s"
(** Storage key for a user registration by Zulip ID - this is the only storage key we use *)
let storage_key_for_id zulip_id = Printf.sprintf "user:id:%d" zulip_id
···
| None -> is_admin || (zulip_id = default_admin_id)
+
(* Preserve last_river_post_date if user already exists *)
+
let last_river_post_date = match existing_by_id with
+
| Some existing -> existing.last_river_post_date
registered_at = Unix.gettimeofday ();
is_admin = final_is_admin;
let reg_str = user_registration_to_string reg in
···
String.contains domain '.'
+
(** {1 River Integration Helper Functions} *)
+
(** Configuration storage keys for River *)
+
let river_feeds_key = "river:feeds:list"
+
let river_channel_key = "river:channel"
+
let river_polling_enabled_key = "river:polling:enabled"
+
let river_last_sync_key = "river:last_sync"
+
let river_default_channel = "Sandbox-test"
+
(** Feed source codec *)
+
let feed_source_jsont =
+
let make name url = { River.name; url } in
+
Jsont.Object.map ~kind:"FeedSource" make
+
|> Jsont.Object.mem "name" Jsont.string ~enc:(fun s -> s.River.name)
+
|> Jsont.Object.mem "url" Jsont.string ~enc:(fun s -> s.River.url)
+
(** Load feed sources from bot storage *)
+
let load_feed_sources storage =
+
match Bot_storage.get storage ~key:river_feeds_key with
+
| Some json_str when json_str <> "" ->
+
(match Jsont_bytesrw.decode_string' (Jsont.list feed_source_jsont) json_str with
+
Log.debug (fun m -> m "Loaded %d feed sources" (List.length feeds));
+
Log.err (fun m -> m "Failed to parse feed sources: %s" (Jsont.Error.to_string err));
+
Log.debug (fun m -> m "No feed sources configured");
+
(** Save feed sources to bot storage *)
+
let save_feed_sources storage feeds =
+
match Jsont_bytesrw.encode_string' ~format:Jsont.Indent (Jsont.list feed_source_jsont) feeds with
+
Bot_storage.put storage ~key:river_feeds_key ~value:json_str
+
let msg = Printf.sprintf "Failed to encode feed sources: %s" (Jsont.Error.to_string err) in
+
Error (Zulip.create_error ~code:(Other "encoding_error") ~msg ())
+
(** Add a feed source *)
+
let add_feed storage ~name ~url =
+
let feeds = load_feed_sources storage in
+
if List.exists (fun f -> f.River.url = url) feeds then
+
Error (Zulip.create_error ~code:(Other "already_exists")
+
~msg:(Printf.sprintf "Feed with URL %s already exists" url) ())
+
let new_feed = { River.name; url } in
+
save_feed_sources storage (new_feed :: feeds)
+
(** Remove a feed source *)
+
let remove_feed storage ~name =
+
let feeds = load_feed_sources storage in
+
let updated_feeds = List.filter (fun f -> f.River.name <> name) feeds in
+
if List.length updated_feeds = List.length feeds then
+
Error (Zulip.create_error ~code:(Other "not_found")
+
~msg:(Printf.sprintf "Feed '%s' not found" name) ())
+
save_feed_sources storage updated_feeds
+
(** Get target Zulip channel *)
+
let get_river_channel storage =
+
match Bot_storage.get storage ~key:river_channel_key with
+
| Some ch when ch <> "" -> ch
+
| _ -> river_default_channel
+
(** Set target Zulip channel *)
+
let set_river_channel storage channel =
+
Bot_storage.put storage ~key:river_channel_key ~value:channel
+
(** Check if polling is enabled *)
+
let is_river_polling_enabled storage =
+
match Bot_storage.get storage ~key:river_polling_enabled_key with
+
let enable_river_polling storage =
+
Bot_storage.put storage ~key:river_polling_enabled_key ~value:"true"
+
let disable_river_polling storage =
+
Bot_storage.put storage ~key:river_polling_enabled_key ~value:"false"
+
(** Get last sync timestamp *)
+
let get_river_last_sync storage =
+
match Bot_storage.get storage ~key:river_last_sync_key with
+
| Some ts_str when ts_str <> "" ->
+
(try Some (float_of_string ts_str) with _ -> None)
+
(** Update last sync timestamp *)
+
let update_river_last_sync storage timestamp =
+
Bot_storage.put storage ~key:river_last_sync_key ~value:(string_of_float timestamp)
+
(** {1 Command Handlers} *)
(** Handle the 'register' command *)
let handle_register storage sender_email sender_id sender_name custom_email_opt =
(* First, try to fetch the user's profile from the Zulip API to get delivery_email and email *)
···
(String.concat "\n" user_lines)
+
(** Handle River 'feeds' command *)
+
let handle_river_feeds storage =
+
let feeds = load_feed_sources storage in
+
"📡 No River feeds configured yet.\n\nUse `river add-feed <name> <url>` to add a feed."
+
let feed_lines = List.mapi (fun i feed ->
+
Printf.sprintf "%d. **%s**\n URL: `%s`" (i + 1) feed.River.name feed.River.url
+
Printf.sprintf "📡 Configured River feeds (%d):\n\n%s\n\nChannel: #%s"
+
(String.concat "\n\n" feed_lines)
+
(get_river_channel storage)
+
(** Handle River 'add-feed' command *)
+
let handle_river_add_feed storage args =
+
match String.split_on_char ' ' args |> List.filter (fun s -> s <> "") with
+
let url = String.concat " " url_parts in
+
(match add_feed storage ~name ~url with
+
Printf.sprintf "✅ Added feed **%s**\n URL: `%s`\n\nUse `river sync` to fetch posts." name url
+
Printf.sprintf "❌ Failed to add feed: %s" (Zulip.error_message e))
+
"Usage: `river add-feed <name> <url>`\n\nExample: `river add-feed \"OCaml Blog\" https://ocaml.org/blog/feed.xml`"
+
(** Handle River 'remove-feed' command *)
+
let handle_river_remove_feed storage args =
+
let name = String.trim args in
+
"Usage: `river remove-feed <name>`\n\nExample: `river remove-feed \"OCaml Blog\"`"
+
match remove_feed storage ~name with
+
Printf.sprintf "✅ Removed feed: **%s**" name
+
Printf.sprintf "❌ Failed to remove feed: %s" (Zulip.error_message e)
+
(** Handle River 'set-channel' command *)
+
let handle_river_set_channel storage args =
+
let channel = String.trim args in
+
Printf.sprintf "Current channel: #%s\n\nUsage: `river set-channel <channel-name>`\n\nExample: `river set-channel general`"
+
(get_river_channel storage)
+
match set_river_channel storage channel with
+
Printf.sprintf "✅ River posts will now go to #%s" channel
+
Printf.sprintf "❌ Failed to set channel: %s" (Zulip.error_message e)
+
(** Handle River 'start' command *)
+
let handle_river_start storage =
+
match enable_river_polling storage with
+
| Ok () -> "✅ River polling enabled. Feeds will be checked every 5 minutes."
+
| Error e -> Printf.sprintf "❌ Failed to enable polling: %s" (Zulip.error_message e)
+
(** Handle River 'stop' command *)
+
let handle_river_stop storage =
+
match disable_river_polling storage with
+
| Ok () -> "⏸️ River polling disabled. Use `river start` to resume."
+
| Error e -> Printf.sprintf "❌ Failed to disable polling: %s" (Zulip.error_message e)
+
(** Handle River 'status' command *)
+
let handle_river_status storage =
+
let feeds = load_feed_sources storage in
+
let polling_status = if is_river_polling_enabled storage then "✅ Enabled" else "⏸️ Disabled" in
+
let last_sync = match get_river_last_sync storage with
+
| Some ts -> format_timestamp ts
+
Printf.sprintf "📊 River Feed Integration Status:\n\
+
• Target channel: #%s\n\
+
• Feeds configured: %d\n\
+
(get_river_channel storage)
(** Handle the 'help' command *)
let handle_help sender_name sender_email =
+
Printf.sprintf "👋 Hi %s! I'm **Vicuna**, your user registration and feed aggregation assistant.\n\n\
+
**User Registration Commands:**\n\
• `register` - Auto-detect your real email or use Zulip email\n\
• `register <your-email@example.com>` - Register with a specific email\n\
• `whoami` - Show your registration status\n\
• `whois <email|id>` - Look up a registered user\n\
+
• `list` - List all registered users\n\n\
+
**River Feed Commands:**\n\
+
• `river feeds` - List all configured feeds\n\
+
• `river add-feed <name> <url>` - Add a new feed\n\
+
• `river remove-feed <name>` - Remove a feed\n\
+
• `river sync` - Force immediate feed sync\n\
+
• `river status` - Show River integration status\n\
+
• `river set-channel <name>` - Set target Zulip channel\n\
+
• `river start` - Enable automatic polling\n\
+
• `river stop` - Disable automatic polling\n\
• `help` - Show this help message\n\n\
• `register` - Auto-detect your email (your Zulip email is `%s`)\n\
+
• `river add-feed \"OCaml Weekly\" https://ocaml.org/feed.xml`\n\
+
• `river set-channel sandbox-test`\n\n\
Send me a direct message to get started!"
···
handle_whois storage args
+
(* Parse river subcommand *)
+
let (subcmd, subargs) = parse_command args in
+
let subcmd_lower = String.lowercase_ascii subcmd in
+
(match subcmd_lower with
+
| "" | "feeds" | "list" ->
+
handle_river_feeds storage
+
| "add-feed" | "add" ->
+
handle_river_add_feed storage subargs
+
| "remove-feed" | "remove" | "rm" ->
+
handle_river_remove_feed storage subargs
+
| "set-channel" | "channel" ->
+
handle_river_set_channel storage subargs
+
| "start" | "enable" ->
+
handle_river_start storage
+
| "stop" | "disable" ->
+
handle_river_stop storage
+
handle_river_status storage
+
"⏳ Syncing River feeds... (Note: sync requires environment access, use CLI for now)"
+
Printf.sprintf "Unknown river command: `%s`\n\nAvailable: feeds, add-feed, remove-feed, set-channel, start, stop, status, sync" subcmd)
Printf.sprintf "Unknown command: `%s`. Use `help` to see available commands." command
···
| Ok () -> Bot_storage.remove storage ~key
+
(** Normalize a name for fuzzy matching *)
+
let normalize_name name =
+
|> String.lowercase_ascii
+
|> Str.global_replace (Str.regexp "[ \t\n\r]+") " "
+
(** Match user by exact name *)
+
let lookup_user_by_name_exact storage name =
+
let all_ids = get_all_user_ids storage in
+
List.find_map (fun id ->
+
match lookup_user_by_id storage id with
+
| Some user when user.full_name = name -> Some user
+
(** Match user by fuzzy name *)
+
let lookup_user_by_name_fuzzy storage name =
+
let normalized_query = normalize_name name in
+
let all_ids = get_all_user_ids storage in
+
List.find_map (fun id ->
+
match lookup_user_by_id storage id with
+
| Some user when normalize_name user.full_name = normalized_query -> Some user
+
(** Smart user matching for a River post *)
+
let match_user_for_post storage (post : River.post) =
+
let author_email = River.email post in
+
let author_name = River.author post in
+
Log.debug (fun m -> m "Matching user for post by %s (%s)" author_name author_email);
+
(* Try email → name exact → name fuzzy *)
+
match lookup_user_by_email storage author_email with
+
Log.debug (fun m -> m "Matched by email: %s" user.email);
+
(match lookup_user_by_name_exact storage author_name with
+
Log.debug (fun m -> m "Matched by exact name: %s" user.full_name);
+
match lookup_user_by_name_fuzzy storage author_name with
+
Log.debug (fun m -> m "Matched by fuzzy name: %s" user.full_name);
+
Log.debug (fun m -> m "No user match found");
+
(** Convert HTML content to markdown summary *)
+
let content_to_summary content_html ~max_length =
+
let markdown = Markdown_converter.to_markdown content_html in
+
if String.length markdown <= max_length then markdown
+
else String.sub markdown 0 (max_length - 3) ^ "..."
+
(** Format a River post for Zulip *)
+
let format_river_post ~user_match (post : River.post) =
+
match River.summary post with
+
| None -> content_to_summary (River.content post) ~max_length:200
+
| Some user -> Printf.sprintf "By @**%s**" user.full_name
+
| None -> Printf.sprintf "By %s" (River.author post)
+
match River.link post with
+
| Some uri -> Printf.sprintf "\n\n[Read more](%s)" (Uri.to_string uri)
+
Printf.sprintf "%s\n\n%s%s" author_line summary link_line
+
(** Update user's last_river_post_date *)
+
let update_user_river_date storage user new_date =
+
let updated = { user with last_river_post_date = Some new_date } in
+
let reg_str = user_registration_to_string updated in
+
Bot_storage.put storage ~key:(storage_key_for_id user.zulip_id) ~value:reg_str
+
(** Get latest post date from a list of posts *)
+
let get_latest_post_date posts =
+
List.fold_left (fun acc post ->
+
match River.date post with
+
let timestamp = Ptime.to_float_s ptime in
+
| None -> Some timestamp
+
| Some existing -> Some (max existing timestamp))
+
(** Filter posts newer than a timestamp *)
+
let filter_posts_since posts since_opt =
+
List.filter (fun post ->
+
match River.date post with
+
Ptime.to_float_s ptime > since
+
(** Post to Zulip channel *)
+
let post_to_zulip client ~channel ~topic ~content =
+
let stream_message = Zulip.Message.create ~type_:`Channel ~to_:[channel] ~topic ~content () in
+
Zulip.Messages.send client stream_message
+
(** Sync feeds and post new items *)
+
let sync_river_and_post ~env ~storage ~client () =
+
Log.info (fun m -> m "Starting River feed sync");
+
let feeds = load_feed_sources storage in
+
Log.info (fun m -> m "No feeds configured, skipping sync");
+
River.with_session env (fun session ->
+
Log.debug (fun m -> m "Fetching %d feeds" (List.length feeds));
+
let fetched_feeds = List.map (fun source ->
+
Log.debug (fun m -> m "Fetching: %s" source.River.name);
+
River.fetch session source
+
let all_posts = River.posts fetched_feeds in
+
Log.info (fun m -> m "Fetched %d total posts" (List.length all_posts));
+
let users = List.filter_map (lookup_user_by_id storage) (get_all_user_ids storage) in
+
let posted_count = ref 0 in
+
let channel = get_river_channel storage in
+
let new_posts = filter_posts_since all_posts user.last_river_post_date in
+
let user_match = match_user_for_post storage post in
+
let topic = River.title post in
+
let content = format_river_post ~user_match post in
+
Log.info (fun m -> m "Posting to #%s: %s" channel topic);
+
match post_to_zulip client ~channel ~topic ~content with
+
| Ok _response -> incr posted_count
+
| Error e -> Log.err (fun m -> m "Failed to post: %s" (Zulip.error_message e))
+
match get_latest_post_date all_posts with
+
| Some latest -> let _ = update_user_river_date storage user latest in ()
+
let _ = update_river_last_sync storage (Unix.gettimeofday ()) in
+
Log.info (fun m -> m "Sync complete, posted %d items" !posted_count);
+
let msg = Printf.sprintf "Sync failed: %s" (Printexc.to_string exn) in
+
Log.err (fun m -> m "%s" msg);
+
Error (Zulip.create_error ~code:(Other "sync_error") ~msg ())
(** Create the bot handler instance *)
let create_handler config storage identity =