Browse Source

Working Verse of the day parsing.

Steve Thielemann 1 month ago
parent
commit
f09cee1576
1 changed files with 27 additions and 1 deletions
  1. 27 1
      src/parse.rs

+ 27 - 1
src/parse.rs

@@ -16,12 +16,34 @@ pub fn find_vod(html: &String) -> Result<String> {
     // let a_selector = scraper::Selector::parse(r#"div>a[href^="/bible/"]"#).unwrap();
     let mut result: Vec<(String, String)> = Vec::new();
 
+    // How about this?
+    {
+        let vod_div_select = scraper::Selector::parse("main>div>div>div>div").unwrap();
+        if let Some(vod_div) = document.select(&vod_div_select).next() {
+            // Ok, search just in this div for things of interest.
+            let h1_select = scraper::Selector::parse("h1").unwrap();
+            let h1 = vod_div.select(&h1_select).next().unwrap();
+            println!("h1 = {:?}", h1.text().collect::<Vec<_>>());
+            let p_select = scraper::Selector::parse("p").unwrap();
+            let p = vod_div.select(&p_select).next().unwrap();
+            println!("p = {:?}", p.text().collect::<Vec<_>>());
+
+            let a_select = scraper::Selector::parse(r#"div[class~="mbs-2"]>a"#).unwrap();
+            for a in vod_div.select(&a_select) {
+                println!("a = {:?}", a.text().collect::<Vec<_>>());
+            }
+        }
+    }
+
+    /* 
     // Verse of the day is div with two a's.
     let h1_selector = scraper::Selector::parse("div>h1").unwrap();
     let h1 = document.select(&h1_selector).next().unwrap();
     println!("{:?}", h1.text().collect::<Vec<_>>());
     let a = next_element(h1).unwrap();
     println!("a : {}", a.html());
+    */
+
     /*
     let a = next_element(a).unwrap();
     println!("a : {}", a.html());
@@ -33,11 +55,13 @@ pub fn find_vod(html: &String) -> Result<String> {
         scraper::Selector::parse(r#"a[href^="/bible/"][class~="no-underline"]"#).unwrap();
     let p_selector = scraper::Selector::parse("div>p").unwrap();
 
+    println!("=====");
+    
     for prev_div in document.select(&prev_div_selector) {
         if let Some(p) = prev_div.select(&p_selector).next() {
             println!("{:?}", p.text().collect::<Vec<_>>());
         }
-        
+
         let mut last_verse = String::new();
         for a in prev_div.select(&a_selector1) {
             if let Some(href) = a.attr("href") {
@@ -49,6 +73,7 @@ pub fn find_vod(html: &String) -> Result<String> {
         println!("-----");
     }
 
+    /*
     println!("And finally...");
     let a_selector =
         scraper::Selector::parse(r#"div>a[href^="/bible/"][class~="no-underline"]"#).unwrap();
@@ -60,6 +85,7 @@ pub fn find_vod(html: &String) -> Result<String> {
             println!("html: {}", a.html());
         };
     }
+    */
     bail!("More dERP!");
 }