Skip to content

Commit

Permalink
feat(html): Handle mismatched tags
Browse files Browse the repository at this point in the history
- Adds an extension point for handling mismatched tags in malformed HTML
- Adds several mismatched tag handlers
- Implements Display on HtmlDocument
  • Loading branch information
James-LG committed Jul 20, 2023
1 parent 3967080 commit ffac82f
Show file tree
Hide file tree
Showing 9 changed files with 1,145 additions and 326 deletions.
5 changes: 5 additions & 0 deletions .vscode/settings.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
    "rust-analyzer.linkedProjects": ["./Cargo.toml"]
}
55 changes: 29 additions & 26 deletions Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,26 +1,29 @@
[package]
name = "skyscraper"
version = "0.4.0"
authors = ["James La Novara-Gsell <james.lanovara.gsell@gmail.com>"]
categories = ["parsing"]
edition = "2018"
homepage = "https://github.com/James-LG/Skyscraper"
license = "MIT"
readme = "README.md"
repository = "https://github.com/James-LG/Skyscraper"
description = "XPath for HTML web scraping"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

# Runtime dependencies, sorted alphabetically.
[dependencies]
indexmap = "1.8.2"
indextree = "4.3.1"
lazy_static = "1.4.0"
thiserror = "1.0.30"

# Dependencies used only for tests and benchmarks.
[dev-dependencies]
criterion = "0.3"

# Benchmark target named "benchmarks". `harness = false` turns off the
# built-in libtest harness for this target — presumably so the Criterion
# dev-dependency can supply its own entry point (confirm against the bench source).
[[bench]]
name = "benchmarks"
harness = false
[package]
name = "skyscraper"
version = "0.5.0"
authors = ["James La Novara-Gsell <james.lanovara.gsell@gmail.com>"]
categories = ["parsing"]
edition = "2018"
homepage = "https://github.com/James-LG/Skyscraper"
license = "MIT"
readme = "README.md"
repository = "https://github.com/James-LG/Skyscraper"
description = "XPath for HTML web scraping"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

# Runtime dependencies, sorted alphabetically.
[dependencies]
indexmap = "2.0.0"
indextree = "4.3.1"
lazy_static = "1.4.0"
log = "0.4.19"
thiserror = "1.0.30"

# Dependencies used only for tests and benchmarks.
[dev-dependencies]
criterion = "0.5.1"
indoc = "2"
mockall = "0.11.4"

# Benchmark target named "benchmarks". `harness = false` turns off the
# built-in libtest harness for this target — presumably so the Criterion
# dev-dependency can supply its own entry point (confirm against the bench source).
[[bench]]
name = "benchmarks"
harness = false
Loading

0 comments on commit ffac82f

Please sign in to comment.