commit 5b7122a2a1533c433659d18e1a668b1938aa36b7 · bretton.dev/coves

+6 -3

aggregators/kagi-news/src/html_parser.py

···

       78
        
                   Perspective(

     

       79
        
                       actor=p['actor'],

     

       80
        
                       description=p['description'],

     

       81
       -
                       source_url=p['source_url']

     

       0
        
       
     

       82
        
                   )

     

       83
        
                   for p in parsed['perspectives']

     

       84
        
               ]

     
···

       230
        
               actor, rest = full_text.split(':', 1)

     

       231
        
               actor = actor.strip()

     

       232
        
       

     

       233
       -
               # Find the <a> tag for source URL

     

       234
        
               a_tag = li.find('a')

     

       235
        
               source_url = a_tag['href'] if a_tag and a_tag.get('href') else ""

     

       0
        
       
     

       236
        
       

     

       237
        
               # Extract description (between colon and source link)

     

       238
        
               # Remove the source citation part in parentheses

     
···

       250
        
               return {

     

       251
        
                   'actor': actor,

     

       252
        
                   'description': description,

     

       253
       -
                   'source_url': source_url

     

       0
        
       
     

       254
        
               }

     

       255
        
       

     

       256
        
           def _extract_sources(self, soup: BeautifulSoup) -> List[Dict]:

···

       78
        
                   Perspective(

     

       79
        
                       actor=p['actor'],

     

       80
        
                       description=p['description'],

     

       81
       +
                       source_url=p['source_url'],

     

       82
       +
                       source_name=p.get('source_name', '')

     

       83
        
                   )

     

       84
        
                   for p in parsed['perspectives']

     

       85
        
               ]

     
···

       231
        
               actor, rest = full_text.split(':', 1)

     

       232
        
               actor = actor.strip()

     

       233
        
       

     

       234
       +
               # Find the <a> tag for source URL and name

     

       235
        
               a_tag = li.find('a')

     

       236
        
               source_url = a_tag['href'] if a_tag and a_tag.get('href') else ""

     

       237
       +
               source_name = a_tag.get_text(strip=True) if a_tag else ""

     

       238
        
       

     

       239
        
               # Extract description (between colon and source link)

     

       240
        
               # Remove the source citation part in parentheses

     
···

       252
        
               return {

     

       253
        
                   'actor': actor,

     

       254
        
                   'description': description,

     

       255
       +
                   'source_url': source_url,

     

       256
       +
                   'source_name': source_name

     

       257
        
               }

     

       258
        
       

     

       259
        
           def _extract_sources(self, soup: BeautifulSoup) -> List[Dict]:

aggregators/kagi-news/src/models.py

···

       20
        
           actor: str

     

       21
        
           description: str

     

       22
        
           source_url: str

     

       0
        
       
     

       23
        
       

     

       24
        
       

     

       25
        
       @dataclass

···

       20
        
           actor: str

     

       21
        
           description: str

     

       22
        
           source_url: str

     

       23
       +
           source_name: str = ""  # Name of the source (e.g., "The Straits Times")

     

       24
        
       

     

       25
        
       

     

       26
        
       @dataclass

+11 -7

aggregators/kagi-news/src/richtext_formatter.py

···

       42
        
                   builder.add_bold("Highlights:")

     

       43
        
                   builder.add_text("\n")

     

       44
        
                   for highlight in story.highlights:

     

       45
       -
                       builder.add_text(f"• {highlight}\n")

     

       46
        
                   builder.add_text("\n")

     

       47
        
       

     

       48
        
               # Perspectives (if present)

     
···

       53
        
                       # Bold the actor name

     

       54
        
                       actor_with_colon = f"{perspective.actor}:"

     

       55
        
                       builder.add_bold(actor_with_colon)

     

       56
       -
                       builder.add_text(f" {perspective.description} (")

     

       57
        
       

     

       58
       -
                       # Add link to source

     

       59
       -
                       source_link_text = "Source"

     

       60
       -
                       builder.add_link(source_link_text, perspective.source_url)

     

       61
       -
                       builder.add_text(")\n")

     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       62
        
                   builder.add_text("\n")

     

       63
        
       

     

       64
        
               # Quote (if present)

     
···

       74
        
                   for source in story.sources:

     

       75
        
                       builder.add_text("• ")

     

       76
        
                       builder.add_link(source.title, source.url)

     

       77
       -
                       builder.add_text(f" - {source.domain}\n")

     

       78
        
                   builder.add_text("\n")

     

       79
        
       

     

       80
        
               # Kagi News attribution

···

       42
        
                   builder.add_bold("Highlights:")

     

       43
        
                   builder.add_text("\n")

     

       44
        
                   for highlight in story.highlights:

     

       45
       +
                       builder.add_text(f"• {highlight}\n\n")

     

       46
        
                   builder.add_text("\n")

     

       47
        
       

     

       48
        
               # Perspectives (if present)

     
···

       53
        
                       # Bold the actor name

     

       54
        
                       actor_with_colon = f"{perspective.actor}:"

     

       55
        
                       builder.add_bold(actor_with_colon)

     

       56
       +
                       builder.add_text(f" {perspective.description}")

     

       57
        
       

     

       58
       +
                       # Add link to source if available

     

       59
       +
                       if perspective.source_url:

     

       60
       +
                           builder.add_text(" (")

     

       61
       +
                           source_link_text = perspective.source_name if perspective.source_name else "Source"

     

       62
       +
                           builder.add_link(source_link_text, perspective.source_url)

     

       63
       +
                           builder.add_text(")")

     

       64
       +
       

     

       65
       +
                       builder.add_text("\n\n")

     

       66
        
                   builder.add_text("\n")

     

       67
        
       

     

       68
        
               # Quote (if present)

     
···

       78
        
                   for source in story.sources:

     

       79
        
                       builder.add_text("• ")

     

       80
        
                       builder.add_link(source.title, source.url)

     

       81
       +
                       builder.add_text(f" - {source.domain}\n\n")

     

       82
        
                   builder.add_text("\n")

     

       83
        
       

     

       84
        
               # Kagi News attribution