Fetch release date
This commit is contained in:
parent
df96c91b4b
commit
4a20c539f6
3 changed files with 51 additions and 2 deletions
|
|
@ -4,3 +4,11 @@ version = "0.1.0"
|
||||||
edition = "2024"
|
edition = "2024"
|
||||||
|
|
||||||
[dependencies]
|
[dependencies]
|
||||||
|
tokio = { version = "1.46.0", default-features = false, features = [
|
||||||
|
"rt-multi-thread",
|
||||||
|
] }
|
||||||
|
futures = "0.3.31"
|
||||||
|
reqwest = "0.12.22"
|
||||||
|
scraper = "0.23.1"
|
||||||
|
regex = "1.11.1"
|
||||||
|
chrono = "0.4.41"
|
||||||
|
|
|
||||||
|
|
@ -22,11 +22,14 @@
|
||||||
packages = {
|
packages = {
|
||||||
default = self.packages.${system}.myapp;
|
default = self.packages.${system}.myapp;
|
||||||
};
|
};
|
||||||
|
|
||||||
# $ nix develop
|
# $ nix develop
|
||||||
devShells.default = pkgs.mkShell {
|
devShells.default = pkgs.mkShell {
|
||||||
|
LD_LIBRARY_PATH = pkgs.lib.makeLibraryPath [pkgs.openssl];
|
||||||
|
|
||||||
packages = [
|
packages = [
|
||||||
pkgs.gnumake
|
pkgs.gnumake
|
||||||
|
pkgs.pkg-config
|
||||||
|
pkgs.openssl
|
||||||
|
|
||||||
# Nix
|
# Nix
|
||||||
pkgs.nixpkgs-fmt
|
pkgs.nixpkgs-fmt
|
||||||
|
|
|
||||||
40
src/main.rs
40
src/main.rs
|
|
@ -1,3 +1,41 @@
|
||||||
|
use chrono::NaiveDate;
|
||||||
|
use regex::Regex;
|
||||||
|
use reqwest::get;
|
||||||
|
use scraper::{Html, Selector};
|
||||||
|
use tokio::runtime::Runtime;
|
||||||
|
|
||||||
fn main() {
|
fn main() {
|
||||||
println!("Hello, world!");
|
let rt = Runtime::new().unwrap();
|
||||||
|
rt.block_on(fetch_release_date("https://lwn.net/Articles/1025629/"));
|
||||||
|
}
|
||||||
|
|
||||||
|
async fn fetch_release_date(url: &str) -> Option<NaiveDate> {
|
||||||
|
let response = get(url).await.unwrap();
|
||||||
|
let response_text = response.text().await.unwrap();
|
||||||
|
|
||||||
|
if let Some(article_text) = Html::parse_document(&response_text)
|
||||||
|
.select(&Selector::parse("div.ArticleText").unwrap())
|
||||||
|
.next()
|
||||||
|
{
|
||||||
|
if let Some(yes) = article_text.select(&Selector::parse("p").unwrap()).last() {
|
||||||
|
let re = Regex::new(
|
||||||
|
r#"(?m)\(Alternatively, this item will become freely\n\s* available on ([A-Z][a-z]+ [0-9]{2}, [0-9]{4})\)"#,
|
||||||
|
)
|
||||||
|
.unwrap();
|
||||||
|
if let Some(cap) = re.captures(&yes.inner_html()) {
|
||||||
|
if let Some(date) = cap.get(1) {
|
||||||
|
return NaiveDate::parse_from_str(date.as_str(), "%B %d, %Y").ok();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
None
|
||||||
|
}
|
||||||
|
|
||||||
|
async fn fetch_paid_articles() -> Option<Vec<String>> {
|
||||||
|
let response = get("https://lwn.net/headlines/rss").await.unwrap();
|
||||||
|
let response_text = response.text().await.unwrap();
|
||||||
|
|
||||||
|
None
|
||||||
}
|
}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue