diff options
| author | Teddy Wing | 2019-11-02 03:42:46 +0100 | 
|---|---|---|
| committer | Teddy Wing | 2019-11-02 03:42:46 +0100 | 
| commit | 67da99861f5ff0a65016cbc7904d37fb3aa4c013 (patch) | |
| tree | 5f7897d2ab48bd70155b47888af3a44d25642a2f /src | |
| parent | 950c7d1a93ae44da2584345e4a2624d64ef84816 (diff) | |
| download | pdf-urls-67da99861f5ff0a65016cbc7904d37fb3aa4c013.tar.bz2 | |
get_urls_from_pdf: Test extracted URLs
Add a test with a simple text-only PDF with three URLs.
Currently I'm getting the following failure, so evidently the extraction
order is not necessarily the same as the visible order, and multi-line
hyperlinks can be encoded as two link areas:
    ---- tests::get_urls_from_pdf_extracts_urls_from_pdf stdout ----
    thread 'tests::get_urls_from_pdf_extracts_urls_from_pdf' panicked at 'assertion failed: `(left == right)`
      left: `["http://www.gutenberg.org/ebooks/11", "https://ia800908.us.archive.org/6/items/alicesadventures19033gut/19033-h/images/i002.jpg", "https://science.nasa.gov/news-article/black-hole-image-makes-history"]`,
     right: `["http://www.gutenberg.org/ebooks/11", "https://science.nasa.gov/news-article/black-hole-image-makes-history", "https://ia800908.us.archive.org/6/items/alicesadventures19033gut/19033-h/images/i002.jpg", "https://ia800908.us.archive.org/6/items/alicesadventures19033gut/19033-h/images/i002.jpg"]`', src/lib.rs:65:9
Diffstat (limited to 'src')
| -rw-r--r-- | src/lib.rs | 19 | 
1 file changed, 19 insertions, 0 deletions
@@ -46,3 +46,22 @@ pub fn get_urls_from_pdf<P: AsRef<Path>>(path: P) -> Result<Vec<String>> {      Ok(urls)  } + + +#[cfg(test)] +mod tests { +    use super::*; + +    #[test] +    fn get_urls_from_pdf_extracts_urls_from_pdf() { +        let expected = vec![ +            "http://www.gutenberg.org/ebooks/11", +            "https://ia800908.us.archive.org/6/items/alicesadventures19033gut/19033-h/images/i002.jpg", +            "https://science.nasa.gov/news-article/black-hole-image-makes-history", +        ]; + +        let urls = get_urls_from_pdf("testdata/Alice's Adventures in Wonderland.pdf"); + +        assert_eq!(expected, urls.unwrap()); +    } +}  | 
