Change metadata
This commit is contained in:
45
.vscode/launch.json
vendored
Normal file
45
.vscode/launch.json
vendored
Normal file
@@ -0,0 +1,45 @@
|
||||
{
|
||||
// Verwendet IntelliSense zum Ermitteln möglicher Attribute.
|
||||
// Zeigen Sie auf vorhandene Attribute, um die zugehörigen Beschreibungen anzuzeigen.
|
||||
// Weitere Informationen finden Sie unter https://go.microsoft.com/fwlink/?linkid=830387
|
||||
"version": "0.2.0",
|
||||
"configurations": [
|
||||
{
|
||||
"type": "lldb",
|
||||
"request": "launch",
|
||||
"name": "Debug executable 'no-man-sky'",
|
||||
"cargo": {
|
||||
"args": [
|
||||
"build",
|
||||
"--bin=no-man-sky",
|
||||
"--package=no-man-sky"
|
||||
],
|
||||
"filter": {
|
||||
"name": "no-man-sky",
|
||||
"kind": "bin"
|
||||
}
|
||||
},
|
||||
"args": [],
|
||||
"cwd": "${workspaceFolder}"
|
||||
},
|
||||
{
|
||||
"type": "lldb",
|
||||
"request": "launch",
|
||||
"name": "Debug unit tests in executable 'no-man-sky'",
|
||||
"cargo": {
|
||||
"args": [
|
||||
"test",
|
||||
"--no-run",
|
||||
"--bin=no-man-sky",
|
||||
"--package=no-man-sky"
|
||||
],
|
||||
"filter": {
|
||||
"name": "no-man-sky",
|
||||
"kind": "bin"
|
||||
}
|
||||
},
|
||||
"args": [],
|
||||
"cwd": "${workspaceFolder}"
|
||||
}
|
||||
]
|
||||
}
|
||||
16
Cargo.toml
Normal file
16
Cargo.toml
Normal file
@@ -0,0 +1,16 @@
|
||||
[package]
|
||||
name = "no-man-sky"
|
||||
version = "0.1.0"
|
||||
edition = "2024"
|
||||
publish = ["merlin"]
|
||||
description = "Utility functions to read environment with fallback and values from a file"
|
||||
license = "MIT"
|
||||
repository = "ssh://git@gitea.merlinserver.de:2222/Stefan/merlin_env_helper.git"
|
||||
|
||||
[dependencies]
|
||||
ego-tree = "0.10.0"
|
||||
env_logger = "0.11.8"
|
||||
log = "0.4.27"
|
||||
merlin_env_helper = { version = "0.2.0", registry = "merlin" }
|
||||
reqwest = {version="0.12.15", features=["blocking"]}
|
||||
scraper = "0.23.1"
|
||||
76
snipped.html
Normal file
76
snipped.html
Normal file
@@ -0,0 +1,76 @@
|
||||
<span
|
||||
class="resource-substanzmithoherenergie"
|
||||
style="border: 1px solid #d3d3d3"
|
||||
>
|
||||
<span class="mw-valign-text-bottom" typeof="mw:File">
|
||||
<a href="/de/wiki/Diwasserstoff" title="Diwasserstoff">
|
||||
<img
|
||||
class="mw-file-element lazyload"
|
||||
data-image-key="SUBSTANCE.LAUNCHSUB.1.png"
|
||||
data-image-name="SUBSTANCE.LAUNCHSUB.1.png"
|
||||
data-relevant="1"
|
||||
data-src="https://static.wikia.nocookie.net/nomanssky_gamepedia/images/0/03/SUBSTANCE.LAUNCHSUB.1.png/revision/latest/scale-to-width-down/18?cb=20180725071716"
|
||||
decoding="async"
|
||||
height="18"
|
||||
loading="lazy"
|
||||
src="%3D%3D"
|
||||
width="18"
|
||||
/>
|
||||
</a>
|
||||
</span>
|
||||
</span>
|
||||
<a href="/de/wiki/Diwasserstoff" title="Diwasserstoff">
|
||||
<span class="itemlink ajaxttlink">Diwasserstoff</span>
|
||||
</a>
|
||||
x1 +
|
||||
<span
|
||||
class="resource-konzentrierterflüssigtreibstoff"
|
||||
style="border: 1px solid #d3d3d3"
|
||||
>
|
||||
<span class="mw-valign-text-bottom" typeof="mw:File">
|
||||
<a href="/de/wiki/Sauerstoff" title="Sauerstoff">
|
||||
<img
|
||||
class="mw-file-element lazyload"
|
||||
data-image-key="SUBSTANCE.AIR.1.png"
|
||||
data-image-name="SUBSTANCE.AIR.1.png"
|
||||
data-relevant="1"
|
||||
data-src="https://static.wikia.nocookie.net/nomanssky_gamepedia/images/e/ec/SUBSTANCE.AIR.1.png/revision/latest/scale-to-width-down/18?cb=20221007220715"
|
||||
decoding="async"
|
||||
height="18"
|
||||
loading="lazy"
|
||||
src="%3D%3D"
|
||||
width="18"
|
||||
/>
|
||||
</a>
|
||||
</span>
|
||||
</span>
|
||||
<a href="/de/wiki/Sauerstoff" title="Sauerstoff">
|
||||
<span class="itemlink ajaxttlink">Sauerstoff</span>
|
||||
</a>
|
||||
x1 →
|
||||
<span
|
||||
class="resource-aquatischesmineral-extrakt"
|
||||
style="border: 1px solid #d3d3d3"
|
||||
>
|
||||
<span class="mw-valign-text-bottom" typeof="mw:File">
|
||||
<a href="/de/wiki/Salz" title="Salz">
|
||||
<img
|
||||
class="mw-file-element lazyload"
|
||||
data-image-key="SUBSTANCE.WATER.1.png"
|
||||
data-image-name="SUBSTANCE.WATER.1.png"
|
||||
data-relevant="1"
|
||||
data-src="https://static.wikia.nocookie.net/nomanssky_gamepedia/images/9/9f/SUBSTANCE.WATER.1.png/revision/latest/scale-to-width-down/18?cb=20180726042119"
|
||||
decoding="async"
|
||||
height="18"
|
||||
loading="lazy"
|
||||
src="%3D%3D"
|
||||
width="18"
|
||||
/>
|
||||
</a>
|
||||
</span>
|
||||
</span>
|
||||
<strong class="mw-selflink selflink">
|
||||
<span class="itemlink ajaxttlink">Salz</span>
|
||||
</strong>
|
||||
x1
|
||||
<small>( <i>"Schnelle Formation/Verdunstung"</i>, 0,08 sek./Stück)</small>
|
||||
155
src/main.rs
Normal file
155
src/main.rs
Normal file
@@ -0,0 +1,155 @@
|
||||
use std::{fs::File, io::{Read}};
|
||||
|
||||
use scraper::{ElementRef, Node};
|
||||
use ego_tree::NodeRef;
|
||||
|
||||
fn main() -> Result<(), Box<dyn std::error::Error>> {
|
||||
env_logger::init();
|
||||
let html = read("test.html")?;
|
||||
parse(&html)?;
|
||||
Ok(())
|
||||
}
|
||||
|
||||
|
||||
fn _download_file(url: &str, _path: &str) -> Result<String, Box<dyn std::error::Error>> {
|
||||
// Some simple CLI args requirements...
|
||||
|
||||
eprintln!("Fetching {url:?}...");
|
||||
|
||||
// reqwest::blocking::get() is a convenience function.
|
||||
//
|
||||
// In most cases, you should create/build a reqwest::Client and reuse
|
||||
// it for all requests.
|
||||
let res = reqwest::blocking::get(url)?;
|
||||
|
||||
|
||||
let body = res.text()?;
|
||||
Ok(body)
|
||||
}
|
||||
|
||||
fn read(path: &str) -> Result<String, std::io::Error> {
|
||||
let mut file = File::open(path)?;
|
||||
let mut contents = String::new();
|
||||
file.read_to_string(&mut contents)?;
|
||||
Ok(contents)
|
||||
}
|
||||
|
||||
fn parse(html: &str) -> Result<bool, Box<dyn std::error::Error>> {
|
||||
// Parse the HTML content
|
||||
let document = scraper::Html::parse_document(html);
|
||||
let selector_quelle = scraper::Selector::parse("#Quelle").unwrap();
|
||||
let selector_verwendung = scraper::Selector::parse("#Verwendung").unwrap();
|
||||
let selector_li = scraper::Selector::parse("li").unwrap();
|
||||
|
||||
let elt_quelle= document.select(&selector_quelle).next();
|
||||
|
||||
if elt_quelle.is_none() {
|
||||
eprintln!("No element found with the selector '#Quelle'");
|
||||
return Ok(false);
|
||||
}
|
||||
|
||||
let elt_quelle = elt_quelle.unwrap();
|
||||
|
||||
let mut elt_quelle = elt_quelle.parent().unwrap();
|
||||
|
||||
let mut c = 0;
|
||||
let mut elt_ul = None;
|
||||
|
||||
while elt_quelle. next_sibling().is_some() {
|
||||
|
||||
elt_quelle = elt_quelle.next_sibling().unwrap();
|
||||
|
||||
if !elt_quelle.value().is_element(){
|
||||
continue;
|
||||
}
|
||||
|
||||
let elt = elt_quelle.value().as_element().unwrap();
|
||||
if elt.name() == "ul" {
|
||||
c += 1;
|
||||
|
||||
if c > 1 {
|
||||
elt_ul = Some(elt_quelle);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
if elt.name() == "h2" {
|
||||
eprintln!("Found 'h2' element, stopping search for 'ul'");
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
if elt_ul.is_none() {
|
||||
eprintln!("No second 'ul' element found after '#Quelle'");
|
||||
return Ok(false);
|
||||
}
|
||||
let elt_ul = ElementRef::wrap(elt_ul.unwrap()).unwrap();
|
||||
let li = elt_ul.select(&selector_li);
|
||||
|
||||
for item in li
|
||||
{
|
||||
parse_li_to_resource(item);
|
||||
}
|
||||
|
||||
let elt_verwendung= document.select(&selector_verwendung).next();
|
||||
|
||||
if elt_verwendung.is_none() {
|
||||
eprintln!("No element found with the selector '#Verwendung'");
|
||||
return Ok(false);
|
||||
}
|
||||
|
||||
let elt_verwendung = elt_verwendung.unwrap();
|
||||
|
||||
Ok(true)
|
||||
}
|
||||
|
||||
fn parse_li_to_resource(item: ElementRef<'_>) {
|
||||
if !item.has_children() {
|
||||
println!("Item has no children, skipping.");
|
||||
return;
|
||||
}
|
||||
|
||||
let mut resource_items = Vec::new();
|
||||
|
||||
let first_child = item.first_child().unwrap();
|
||||
|
||||
resource_items.push(first_child);
|
||||
|
||||
let iter = first_child.next_siblings();
|
||||
|
||||
for next in iter {
|
||||
if next.value().is_text() {
|
||||
resource_items.push(next);
|
||||
}
|
||||
else if next.value().is_element() {
|
||||
if next.value().as_element().unwrap().name() == "span" {
|
||||
parse_resource (resource_items);
|
||||
resource_items = Vec::new();
|
||||
}
|
||||
|
||||
resource_items.push(next);
|
||||
}
|
||||
}
|
||||
|
||||
println!("======================");
|
||||
}
|
||||
|
||||
fn parse_resource(resource_items: Vec<NodeRef<'_, Node>>) {
|
||||
if resource_items.is_empty() {
|
||||
println!("No resource items to parse.");
|
||||
return;
|
||||
}
|
||||
|
||||
println!("Parsing resource items...");
|
||||
|
||||
for item in resource_items {
|
||||
if item.value().is_text() {
|
||||
println!("Text: {}", item.value().as_text().unwrap().text.trim_ascii());
|
||||
continue;
|
||||
}
|
||||
println!("Resource: {:?}", item.value());
|
||||
}
|
||||
|
||||
println!("------------------");
|
||||
|
||||
}
|
||||
8
src/test.html
Normal file
8
src/test.html
Normal file
@@ -0,0 +1,8 @@
|
||||
<html>
|
||||
<body>
|
||||
<img
|
||||
src="%3D%3D"
|
||||
width="18"
|
||||
/>
|
||||
</body>
|
||||
</html>
|
||||
2
src/types/mod.rs
Normal file
2
src/types/mod.rs
Normal file
@@ -0,0 +1,2 @@
|
||||
pub mod types;
|
||||
pub use types::*;
|
||||
0
src/types/types.rs
Normal file
0
src/types/types.rs
Normal file
3
src/util/cmd.rs
Normal file
3
src/util/cmd.rs
Normal file
@@ -0,0 +1,3 @@
|
||||
pub fn parse_command_line_args() -> Vec<String> {
|
||||
std::env::args().skip(1).collect()
|
||||
}
|
||||
2
src/util/mod.rs
Normal file
2
src/util/mod.rs
Normal file
@@ -0,0 +1,2 @@
|
||||
pub mod cmd;
|
||||
pub use cmd::*;
|
||||
Reference in New Issue
Block a user