I have setup the docker container to run the model evaluation.
Write a self-contained Rust program that prints a JSON output of how often each word appears in a text file located in /tmp/file.txt. So if the file contains "This is is is, an example" then the program should print to stdout. {"This": 1, "is": 2, "is,": 1, "an": 1, "example": 1} Don't import any crates that would require a Cargo.toml file. I'll just compile it with `rustc yourfile.rs` and it should work. The program should be run by calling /path/to/rust_word_count with no arguments. Make it run in parallel on 4 cores at the same time, each job taking ~1/4 of the file. Print out 4 differnt json dicts, one per line. I'll do the merging. Do not import serde_json, write json output from scratch.
Write a self-contained Rust program that prints a JSON output of how often each word appears in a text file located in /tmp/file.txt. So if the file contains "This is is is, an example" then the program should print to stdout. {"This": 1, "is": 2, "is,": 1, "an": 1, "example": 1} Don't import any crates that would require a Cargo.toml file. I'll just compile it with `rustc yourfile.rs` and it should work. The program should be run by calling /path/to/rust_word_count with no arguments. Make it run in parallel on 4 cores at the same time, each job taking ~1/4 of the file. Print out 4 differnt json dicts, one per line. I'll do the merging. Do not import serde_json, write json output from scratch.
Here's the Rust program that meets your requirements:
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 | use std::fs; use std::collections::HashMap; use std::sync::Mutex; fn main() -> std::io::Result<()> { let content = fs::read_to_string("/tmp/file.txt")?; let chunks = split_into_chunks(&content, 4); let stdout = Mutex::new(std::io::stdout()); std::thread::scope(|s| { for chunk in chunks { s.spawn(|| { let counts = count_words(chunk); let json = to_json(&counts); let _ = stdout.lock().unwrap().write_fmt(format_args!("{}\n", json)); }); } }); Ok(()) } fn split_into_chunks(s: &str, num_chunks: usize) -> Vec<&str> { let len = s.len(); if len == 0 || num_chunks == 0 { return vec![]; } let mut split_points = vec![0]; for i in 1..num_chunks { let pos = (i * len) / num_chunks; let adjusted_pos = s[pos..] .find(|c: char| c.is_whitespace()) .map(|p| pos + p + 1) .unwrap_or(len) .min(len); split_points.push(adjusted_pos); } split_points.push(len); (0..num_chunks) .map(|i| &s[split_points[i]..split_points[i+1]]) .collect() } fn count_words(s: &str) -> HashMap<String, u32> { let mut counts = HashMap::new(); for word in s.split_whitespace() { *counts.entry(word.to_string()).or_insert(0) += 1; } counts } fn escape_json(s: &str) -> String { let mut escaped = String::new(); for c in s.chars() { match c { '"' => escaped.push_str("\\\""), '\\' => escaped.push_str("\\\\"), '\n' => escaped.push_str("\\n"), '\r' => escaped.push_str("\\r"), '\t' => escaped.push_str("\\t"), _ => escaped.push(c), } } escaped } fn to_json(counts: &HashMap<String, u32>) -> String { let mut entries: Vec<_> = counts.iter() .map(|(k, v)| format!("\"{}\":{}", escape_json(k), v)) .collect(); entries.sort(); format!("{{{}}}", entries.join(", ")) } |
I extracted the following code from that output:
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 | use std::fs; use std::collections::HashMap; use std::sync::Mutex; fn main() -> std::io::Result<()> { let content = fs::read_to_string("/tmp/file.txt")?; let chunks = split_into_chunks(&content, 4); let stdout = Mutex::new(std::io::stdout()); std::thread::scope(|s| { for chunk in chunks { s.spawn(|| { let counts = count_words(chunk); let json = to_json(&counts); let _ = stdout.lock().unwrap().write_fmt(format_args!("{}\n", json)); }); } }); Ok(()) } fn split_into_chunks(s: &str, num_chunks: usize) -> Vec<&str> { let len = s.len(); if len == 0 || num_chunks == 0 { return vec![]; } let mut split_points = vec![0]; for i in 1..num_chunks { let pos = (i * len) / num_chunks; let adjusted_pos = s[pos..] .find(|c: char| c.is_whitespace()) .map(|p| pos + p + 1) .unwrap_or(len) .min(len); split_points.push(adjusted_pos); } split_points.push(len); (0..num_chunks) .map(|i| &s[split_points[i]..split_points[i+1]]) .collect() } fn count_words(s: &str) -> HashMap<String, u32> { let mut counts = HashMap::new(); for word in s.split_whitespace() { *counts.entry(word.to_string()).or_insert(0) += 1; } counts } fn escape_json(s: &str) -> String { let mut escaped = String::new(); for c in s.chars() { match c { '"' => escaped.push_str("\\\""), '\\' => escaped.push_str("\\\\"), '\n' => escaped.push_str("\\n"), '\r' => escaped.push_str("\\r"), '\t' => escaped.push_str("\\t"), _ => escaped.push(c), } } escaped } fn to_json(counts: &HashMap<String, u32>) -> String { let mut entries: Vec<_> = counts.iter() .map(|(k, v)| format!("\"{}\":{}", escape_json(k), v)) .collect(); entries.sort(); format!("{{{}}}", entries.join(", ")) } |
Below is some student's code. I asked them to parallelize some code. Do not judge if it is correct, I have test cases for that. Logic errors are okay. So are synatx errors. Just tell me if they tried to parallelize it. use std::fs; use std::collections::HashMap; use std::sync::Mutex; fn main() -> std::io::Result<()> { let content = fs::read_to_string("/tmp/file.txt")?; let chunks = split_into_chunks(&content, 4); let stdout = Mutex::new(std::io::stdout()); std::thread::scope(|s| { for chunk in chunks { s.spawn(|| { let counts = count_words(chunk); let json = to_json(&counts); let _ = stdout.lock().unwrap().write_fmt(format_args!("{}\n", json)); }); } }); Ok(()) } fn split_into_chunks(s: &str, num_chunks: usize) -> Vec<&str> { let len = s.len(); if len == 0 || num_chunks == 0 { return vec![]; } let mut split_points = vec![0]; for i in 1..num_chunks { let pos = (i * len) / num_chunks; let adjusted_pos = s[pos..] .find(|c: char| c.is_whitespace()) .map(|p| pos + p + 1) .unwrap_or(len) .min(len); split_points.push(adjusted_pos); } split_points.push(len); (0..num_chunks) .map(|i| &s[split_points[i]..split_points[i+1]]) .collect() } fn count_words(s: &str) -> HashMap<String, u32> { let mut counts = HashMap::new(); for word in s.split_whitespace() { *counts.entry(word.to_string()).or_insert(0) += 1; } counts } fn escape_json(s: &str) -> String { let mut escaped = String::new(); for c in s.chars() { match c { '"' => escaped.push_str("\\\""), '\\' => escaped.push_str("\\\\"), '\n' => escaped.push_str("\\n"), '\r' => escaped.push_str("\\r"), '\t' => escaped.push_str("\\t"), _ => escaped.push(c), } } escaped } fn to_json(counts: &HashMap<String, u32>) -> String { let mut entries: Vec<_> = counts.iter() .map(|(k, v)| format!("\"{}\":{}", escape_json(k), v)) .collect(); entries.sort(); format!("{{{}}}", entries.join(", ")) } Answer either 'The student passes' or 'The student fails'.
The student passes.
Testing if the previous output contains the string student passes
: True
Running the following program:
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 | use std::fs; use std::collections::HashMap; use std::sync::Mutex; fn main() -> std::io::Result<()> { let content = fs::read_to_string("/tmp/file.txt")?; let chunks = split_into_chunks(&content, 4); let stdout = Mutex::new(std::io::stdout()); std::thread::scope(|s| { for chunk in chunks { s.spawn(|| { let counts = count_words(chunk); let json = to_json(&counts); let _ = stdout.lock().unwrap().write_fmt(format_args!("{}\n", json)); }); } }); Ok(()) } fn split_into_chunks(s: &str, num_chunks: usize) -> Vec<&str> { let len = s.len(); if len == 0 || num_chunks == 0 { return vec![]; } let mut split_points = vec![0]; for i in 1..num_chunks { let pos = (i * len) / num_chunks; let adjusted_pos = s[pos..] .find(|c: char| c.is_whitespace()) .map(|p| pos + p + 1) .unwrap_or(len) .min(len); split_points.push(adjusted_pos); } split_points.push(len); (0..num_chunks) .map(|i| &s[split_points[i]..split_points[i+1]]) .collect() } fn count_words(s: &str) -> HashMap<String, u32> { let mut counts = HashMap::new(); for word in s.split_whitespace() { *counts.entry(word.to_string()).or_insert(0) += 1; } counts } fn escape_json(s: &str) -> String { let mut escaped = String::new(); for c in s.chars() { match c { '"' => escaped.push_str("\\\""), '\\' => escaped.push_str("\\\\"), '\n' => escaped.push_str("\\n"), '\r' => escaped.push_str("\\r"), '\t' => escaped.push_str("\\t"), _ => escaped.push(c), } } escaped } fn to_json(counts: &HashMap<String, u32>) -> String { let mut entries: Vec<_> = counts.iter() .map(|(k, v)| format!("\"{}\":{}", escape_json(k), v)) .collect(); entries.sort(); format!("{{{}}}", entries.join(", ")) } |
error[E0599]: no method named `write_fmt` found for struct `MutexGuard<'_, Stdout>` in the current scope
--> main.rs:16:48
|
16 | let _ = stdout.lock().unwrap().write_fmt(format_args!("{}\n", json));
| ^^^^^^^^^
|
= help: items from traits can only be used if the trait is in scope
help: trait `Write` which provides `write_fmt` is implemented but not in scope; perhaps you want to import it
|
2 + use std::io::Write;
|
help: there is a method `write` with a similar name
|
16 | let _ = stdout.lock().unwrap().write(format_args!("{}\n", json));
| ~~~~~
error: aborting due to 1 previous error
For more information about this error, try `rustc --explain E0599`.
main.sh: line 2: ./a.out: No such file or directory
Resulting in output: []
Testing if the previous output equals the string [('Darkness,', 1), ('Heaven,', 1), ('Light,', 1), ('age', 2), ('all', 2), ('before', 2), ('belief,', 1), ('best', 1), ('despair,', 1), ('direct', 2), ('epoch', 2), ('everything', 1), ('foolishness,', 1), ('going', 2), ('had', 2), ('hope,', 1), ('incredulity,', 1), ('it', 10), ('nothing', 1), ('of', 10), ('other', 1), ('season', 2), ('spring', 1), ('the', 11), ('times,', 2), ('to', 1), ('us,', 2), ('was', 10), ('way', 1), ('we', 4), ('were', 2), ('winter', 1), ('wisdom,', 1), ('worst', 1)]
: False