English Wikipedia @ Freddythechick:Database reports/Featured articles by size/Configuration

From English Wikipedia @ Freddythechick

This report is updated every 7 days.

Source code

<syntaxhighlight lang="rust"> /* Copyright 2023 Kunal Mehta <legoktm@debian.org>

This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version.

This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.

You should have received a copy of the GNU General Public License along with this program. If not, see <http://www.gnu.org/licenses/>.

*/

use anyhow::Result; use dbreps2::{str_vec, Frequency, Report}; use mwbot::Bot; use mysql_async::prelude::*; use mysql_async::Conn; use wikipedia_prosesize::prosesize;

pub struct Row {

   title: String,
   prose_size: u64,
   word_count: u64,

}

pub struct FeaturedBySize {

   pub(crate) bot: Bot,

}

impl Report<Row> for FeaturedBySize {

   fn title(&self) -> &'static str {
       "Featured articles by size"
   }
   fn frequency(&self) -> Frequency {
       Frequency::Weekly
   }
   fn query(&self) -> &'static str {
       r#"

/* featuredbysize.rs SLOW_OK */ SELECT

 page_title

FROM

 page
 JOIN categorylinks ON cl_from = page_id

WHERE

 cl_to = "Featured_articles"
 AND page_namespace = 0

"#

   }
   async fn run_query(&self, conn: &mut Conn) -> Result<Vec<Row>> {
       let pages: Vec<String> = conn.query(self.query()).await?;
       let mut rows = vec![];
       let mut handles = vec![];
       for title in pages {
           let page = self.bot.page(&title)?;
           handles.push(tokio::spawn(async move {
               let html = page.html().await?;
               let size = prosesize(html);
               Result::<_, anyhow::Error>::Ok((title, size))
           }));
       }
       for handle in handles {
           let (title, size) = handle.await??;
           /* println!("{title}"); */
           rows.push(Row {
               title,
               prose_size: size.prose_size(),
               word_count: size.word_count(),
           })
       }
       rows.sort_by_key(|row| row.prose_size);
       rows.reverse();
       Ok(rows)
   }
   fn intro(&self) -> &'static str {
       "Articles in Category:Featured articles sorted by prose size"
   }
   fn headings(&self) -> Vec<&'static str> {
       vec!["Page", "Prose size", "Word count"]
   }
   fn format_row(&self, row: &Row) -> Vec<String> {
       str_vec![
           format!("[[{}]]", row.title.replace('_', " ")),
           row.prose_size,
           row.word_count
       ]
   }
   fn code(&self) -> &'static str {
       include_str!("featuredbysize.rs")
   }

} </syntaxhighlight>