From fe9345602b6750f09c9616c6caeb1fd465e7380a Mon Sep 17 00:00:00 2001 From: retoor Date: Sat, 30 Nov 2024 23:46:08 +0100 Subject: [PATCH] Updated cargo sources and history management. --- 12bitfloat_rust/isspam_v1.rs | 45 ++----- 12bitfloat_rust/isspam_v2.rs | 140 ++++++++++++++++++++ 12bitfloat_rust/{isspam.rs => isspam_v3.rs} | 49 ++++--- 12bitfloat_rust/risspam/Cargo.toml | 1 + 12bitfloat_rust/risspam/src/main.rs | 49 ++++--- 5 files changed, 220 insertions(+), 64 deletions(-) create mode 100644 12bitfloat_rust/isspam_v2.rs rename 12bitfloat_rust/{isspam.rs => isspam_v3.rs} (74%) diff --git a/12bitfloat_rust/isspam_v1.rs b/12bitfloat_rust/isspam_v1.rs index 83b6686..782349f 100644 --- a/12bitfloat_rust/isspam_v1.rs +++ b/12bitfloat_rust/isspam_v1.rs @@ -1,5 +1,6 @@ -#!+[feature(let_chains)] +#![feature(let_chains)] +use std::{env, fs}; fn clean_content(content: &str) -> String { let alloed_ichars = "01234567891abcdefghijklmnopqrstuvwxyz \n.,!?"; @@ -98,17 +99,17 @@ fn analyze(data: &str) { } fn main() { -// // Read in files from args -// for arg in env::args() { -// let Ok(text) = fs::read_to_string(arg) else { -// eprintln!("{arg} isn't a valid file or couldn't be read"); -// continue; -// }; -// -// analyze(&text); -// } - - analyze(&SPAM1); + // Read in files from args + for arg in env::args().skip(1) { // skip program arg + let Ok(text) = fs::read_to_string(&arg) else { + eprintln!("{arg} isn't a valid file or couldn't be read"); + continue; + }; + + analyze(&text); + } + +// analyze(&SPAM1); } static FORBIDDEN_WORDS: &'static [&'static str] = &[ @@ -118,23 +119,3 @@ static FORBIDDEN_WORDS: &'static [&'static str] = &[ "transaction", "essential", "managing", "contact", "contacting", "understanding", "assets", "funds" ]; -static SPAM1: &'static str = "HIRE Century Web Recovery TO RECOVER YOUR LOST BITCOIN - If you’ve lost your Bitcoin to an online scam, hiring a professional recovery service can significantly improve your chances of getting your funds back. Century Web Recovery specializes in Bitcoin recovery, helping victims reclaim their stolen assets. Here’s what you need to know: - - Understanding the Recovery Process - The recovery process begins with contacting Century Web Recovery. Their team will guide you through the steps necessary to initiate an investigation into your case. Understanding the process is key to managing your expectations. - - Documenting Your Case - To facilitate recovery, it’s essential to document all relevant information regarding the scam. This includes transaction records, wallet addresses, and any communications with the scammer. Century Web Recovery will help you gather this information to build a strong case. - - Investigation and Tracking - Once you hire Century Web Recovery, their experts will begin investigating your case. They use sophisticated tools to track the stolen Bitcoin, identifying the paths taken by the scammers. This tracing is crucial for successful recovery. - - Freezing Stolen Assets - Quick action is vital in recovering stolen Bitcoin.Century Web Recovery works directly with cryptocurrency exchanges to freeze any stolen assets, preventing the scammers from cashing out your funds. This collaboration is essential for a successful recovery. - - Legal Support and Guidance - If necessary, Century Web Recovery can provide legal support. They will guide you on reporting the scam to law enforcement and assist in filing any legal claims. Their expertise in crypto-related cases ensures you receive the best advice on how to proceed. - - If you’ve lost Bitcoin to an online scam, don’t hesitate. Hire Century Web Recovery to recover your lost assets and regain your financial security."; - diff --git a/12bitfloat_rust/isspam_v2.rs b/12bitfloat_rust/isspam_v2.rs new file mode 100644 index 0000000..83b6686 --- /dev/null +++ b/12bitfloat_rust/isspam_v2.rs @@ -0,0 +1,140 @@ +#!+[feature(let_chains)] + + +fn clean_content(content: &str) -> String { + let alloed_ichars = "01234567891abcdefghijklmnopqrstuvwxyz \n.,!?"; + + let clean_content = content.chars() + .filter(|&c| alloed_ichars.contains(c)) + .collect::(); + + clean_content +} + +fn get_sentences(content: &str) -> Vec<&str> { + let mut sentences = content.split('.') + .map(|s| s.trim_start()) // Remove leading whitespace + .collect::>(); + + // Remove last "sentence" if didn't end with a dot + if let Some(last) = sentences.last() && !last.ends_with('.') { + sentences.pop(); + } + + sentences +} + +fn get_words(sentences: &str) -> impl Iterator + Clone { + sentences.split_whitespace() +} + +fn is_fully_capitalized_word(word: &str) -> bool { + word.chars() + .all(|c| !c.is_ascii_alphanumeric() || c.is_ascii_uppercase()) +} + +fn get_capitalized_words(content: &str) -> Vec<&str> { + let sentences = get_sentences(content); + let mut cap_words = vec![]; + + for sentence in sentences { + // Always skip the first word since sentences start with + for word in get_words(sentence).skip(1) { + if is_fully_capitalized_word(word) { + cap_words.push(word); + } + } + } + + cap_words +} + +fn get_numbers(content: &str) -> Vec { + let clean = clean_content(content); + + clean.split(|c: char| c.is_ascii_digit()) + .map(|n| n.to_string()) + .collect() +} + +fn get_forbidden_words(content: &str) -> Vec<&str> { + fn check_forbidden(w: &str) -> bool { + FORBIDDEN_WORDS.iter() + .find(|fw| str::eq_ignore_ascii_case(w, fw)) + .is_some() + } + + get_words(content) + .filter(|w| check_forbidden(w)) + .collect() +} + +fn analyze(data: &str) { + let clean_data = clean_content(data); + drop(clean_data); // You aren't actually using clean_data :O + + // All capitalized words + let cap_words = get_capitalized_words(data); + println!("All capitalized words: {}", cap_words.len()); + + // All sentences + let sentences = get_sentences(data); + println!("Sentences: {}", sentences.len()); + + // All words + let words = get_words(data); + println!("Words: {}", words.clone().count()); + + // Numbers + let numbers = get_numbers(data); + println!("Numbers: {}", numbers.len()); + + // Forbidden words + let fw = get_forbidden_words(data); + println!("Forbidden words: {}", fw.len()); + + let word_count_per_sentence = words.count() / sentences.len(); + println!("Word count per sentence: {}", word_count_per_sentence); +} + +fn main() { +// // Read in files from args +// for arg in env::args() { +// let Ok(text) = fs::read_to_string(arg) else { +// eprintln!("{arg} isn't a valid file or couldn't be read"); +// continue; +// }; +// +// analyze(&text); +// } + + analyze(&SPAM1); +} + +static FORBIDDEN_WORDS: &'static [&'static str] = &[ + "recovery", "techie", "http", "https", "digital", "hack", "::", "//", "com", + "@", "crypto", "bitcoin", "wallet", "hacker", "welcome", "whatsapp", "email", "cryptocurrency", + "stolen", "freeze", "quick", "crucial", "tracing", "scammers", "expers", "hire", "century", + "transaction", "essential", "managing", "contact", "contacting", "understanding", "assets", "funds" +]; + +static SPAM1: &'static str = "HIRE Century Web Recovery TO RECOVER YOUR LOST BITCOIN + If you’ve lost your Bitcoin to an online scam, hiring a professional recovery service can significantly improve your chances of getting your funds back. Century Web Recovery specializes in Bitcoin recovery, helping victims reclaim their stolen assets. Here’s what you need to know: + + Understanding the Recovery Process + The recovery process begins with contacting Century Web Recovery. Their team will guide you through the steps necessary to initiate an investigation into your case. Understanding the process is key to managing your expectations. + + Documenting Your Case + To facilitate recovery, it’s essential to document all relevant information regarding the scam. This includes transaction records, wallet addresses, and any communications with the scammer. Century Web Recovery will help you gather this information to build a strong case. + + Investigation and Tracking + Once you hire Century Web Recovery, their experts will begin investigating your case. They use sophisticated tools to track the stolen Bitcoin, identifying the paths taken by the scammers. This tracing is crucial for successful recovery. + + Freezing Stolen Assets + Quick action is vital in recovering stolen Bitcoin.Century Web Recovery works directly with cryptocurrency exchanges to freeze any stolen assets, preventing the scammers from cashing out your funds. This collaboration is essential for a successful recovery. + + Legal Support and Guidance + If necessary, Century Web Recovery can provide legal support. They will guide you on reporting the scam to law enforcement and assist in filing any legal claims. Their expertise in crypto-related cases ensures you receive the best advice on how to proceed. + + If you’ve lost Bitcoin to an online scam, don’t hesitate. Hire Century Web Recovery to recover your lost assets and regain your financial security."; + diff --git a/12bitfloat_rust/isspam.rs b/12bitfloat_rust/isspam_v3.rs similarity index 74% rename from 12bitfloat_rust/isspam.rs rename to 12bitfloat_rust/isspam_v3.rs index 782349f..395cea2 100644 --- a/12bitfloat_rust/isspam.rs +++ b/12bitfloat_rust/isspam_v3.rs @@ -1,5 +1,7 @@ #![feature(let_chains)] +use rayon::prelude::*; +//use rayon::prelude::*; use std::{env, fs}; fn clean_content(content: &str) -> String { @@ -50,11 +52,8 @@ fn get_capitalized_words(content: &str) -> Vec<&str> { cap_words } -fn get_numbers(content: &str) -> Vec { - let clean = clean_content(content); - - clean.split(|c: char| c.is_ascii_digit()) - .map(|n| n.to_string()) +fn get_numbers(clean_content: &str) -> Vec<&str> { + clean_content.split(|c: char| c.is_ascii_digit()) .collect() } @@ -72,7 +71,7 @@ fn get_forbidden_words(content: &str) -> Vec<&str> { fn analyze(data: &str) { let clean_data = clean_content(data); - drop(clean_data); // You aren't actually using clean_data :O +// drop(clean_data); // You aren't actually using clean_data :O // All capitalized words let cap_words = get_capitalized_words(data); @@ -87,29 +86,47 @@ fn analyze(data: &str) { println!("Words: {}", words.clone().count()); // Numbers - let numbers = get_numbers(data); + let numbers = get_numbers(&clean_data); println!("Numbers: {}", numbers.len()); // Forbidden words let fw = get_forbidden_words(data); println!("Forbidden words: {}", fw.len()); - let word_count_per_sentence = words.count() / sentences.len(); - println!("Word count per sentence: {}", word_count_per_sentence); + if sentences.len() > 0 { + let word_count_per_sentence = words.count() / sentences.len(); + println!("Word count per sentence: {}", word_count_per_sentence); + } } fn main() { // Read in files from args - for arg in env::args().skip(1) { // skip program arg - let Ok(text) = fs::read_to_string(&arg) else { - eprintln!("{arg} isn't a valid file or couldn't be read"); - continue; + let mut files = Vec::with_capacity(env::args().len()); + let mut do_parallel = false; + + for arg in env::args().skip(1) { // skip program arg + if arg == "-p" { + do_parallel = true; + } else { + files.push(arg); + } + } + + // Do the work + let work = |file| { + let Ok(text) = fs::read_to_string(&file) else { + eprintln!("{file} isn't a valid file or couldn't be read"); + return; }; analyze(&text); - } - -// analyze(&SPAM1); + }; + + if !do_parallel { + files.iter().for_each(work); + } else { + files.par_iter().for_each(work) + } } static FORBIDDEN_WORDS: &'static [&'static str] = &[ diff --git a/12bitfloat_rust/risspam/Cargo.toml b/12bitfloat_rust/risspam/Cargo.toml index 50e88b9..19d72cc 100644 --- a/12bitfloat_rust/risspam/Cargo.toml +++ b/12bitfloat_rust/risspam/Cargo.toml @@ -4,3 +4,4 @@ version = "0.1.0" edition = "2021" [dependencies] +rayon = "1.10.0" diff --git a/12bitfloat_rust/risspam/src/main.rs b/12bitfloat_rust/risspam/src/main.rs index 782349f..395cea2 100644 --- a/12bitfloat_rust/risspam/src/main.rs +++ b/12bitfloat_rust/risspam/src/main.rs @@ -1,5 +1,7 @@ #![feature(let_chains)] +use rayon::prelude::*; +//use rayon::prelude::*; use std::{env, fs}; fn clean_content(content: &str) -> String { @@ -50,11 +52,8 @@ fn get_capitalized_words(content: &str) -> Vec<&str> { cap_words } -fn get_numbers(content: &str) -> Vec { - let clean = clean_content(content); - - clean.split(|c: char| c.is_ascii_digit()) - .map(|n| n.to_string()) +fn get_numbers(clean_content: &str) -> Vec<&str> { + clean_content.split(|c: char| c.is_ascii_digit()) .collect() } @@ -72,7 +71,7 @@ fn get_forbidden_words(content: &str) -> Vec<&str> { fn analyze(data: &str) { let clean_data = clean_content(data); - drop(clean_data); // You aren't actually using clean_data :O +// drop(clean_data); // You aren't actually using clean_data :O // All capitalized words let cap_words = get_capitalized_words(data); @@ -87,29 +86,47 @@ fn analyze(data: &str) { println!("Words: {}", words.clone().count()); // Numbers - let numbers = get_numbers(data); + let numbers = get_numbers(&clean_data); println!("Numbers: {}", numbers.len()); // Forbidden words let fw = get_forbidden_words(data); println!("Forbidden words: {}", fw.len()); - let word_count_per_sentence = words.count() / sentences.len(); - println!("Word count per sentence: {}", word_count_per_sentence); + if sentences.len() > 0 { + let word_count_per_sentence = words.count() / sentences.len(); + println!("Word count per sentence: {}", word_count_per_sentence); + } } fn main() { // Read in files from args - for arg in env::args().skip(1) { // skip program arg - let Ok(text) = fs::read_to_string(&arg) else { - eprintln!("{arg} isn't a valid file or couldn't be read"); - continue; + let mut files = Vec::with_capacity(env::args().len()); + let mut do_parallel = false; + + for arg in env::args().skip(1) { // skip program arg + if arg == "-p" { + do_parallel = true; + } else { + files.push(arg); + } + } + + // Do the work + let work = |file| { + let Ok(text) = fs::read_to_string(&file) else { + eprintln!("{file} isn't a valid file or couldn't be read"); + return; }; analyze(&text); - } - -// analyze(&SPAM1); + }; + + if !do_parallel { + files.iter().for_each(work); + } else { + files.par_iter().for_each(work) + } } static FORBIDDEN_WORDS: &'static [&'static str] = &[