kean-s ignore list

This commit is contained in:
Quentin 2023-06-19 15:24:22 +02:00
parent 3415e10b37
commit 849c741be9
Signed by: quentin
GPG key ID: E9602264D639FF68
2 changed files with 17 additions and 4 deletions

View file

@ -41,9 +41,11 @@ recovery
## Testing strategy
- Unit testing: parser combinator independently.
- Selected full emails
- Enron 500k
- Unit testing: parser combinator independently (done)
- Selected full emails (done)
- Enron 500k (done)
- Fuzzing (expected)
- Across reference IMAP servers (dovecot, cyrus) (expected)
## Development status

View file

@ -12,6 +12,7 @@ fn test_enron500k() {
let mut d = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
d.push("resources/enron/maildir/");
let prefix_sz = d.as_path().to_str().unwrap().len();
//d.push("kean-s/");
let known_bad_fields = HashSet::from([
"white-s/calendar/113.", // To: east <7..>
@ -59,7 +60,17 @@ fn test_enron500k() {
"kaminski-v/notes_inbox/140.", // To: dogs <breakthrough.>, cats <breaktkhrough.>, risk <breakthrough.>,\r\n\tleaders <breaktkhrough.>
"kaminski-v/notes_inbox/95.", // To + CC failed: cats <breaktkhrough.>, risk <breakthrough.>, leaders <breaktkhrough.>
"kean-s/archiving/untitled/1232.", // To: w/assts <govt.>, mark.palmer@enron.com, karen.denne@enron.com
"kean-s/archiving/untitled/1688.", // To: w/assts <govt.>
"kean-s/sent/198.", // To: w/assts <govt.>, mark.palmer@enron.com, karen.denne@enron.com
"kean-s/reg_risk/9.", // To: w/assts <govt.>
"kean-s/discussion_threads/950.", // To: w/assts <govt.>, mark.palmer@enron.com, karen.denne@enron.com
"kean-s/discussion_threads/577.", // To: w/assts <govt.>
"kean-s/calendar/untitled/1096.", // To: w/assts <govt.>, mark.palmer@enron.com, karen.denne@enron.com
"kean-s/calendar/untitled/640.", // To: w/assts <govt.>
"kean-s/all_documents/640.", // To: w/assts <govt.>
"kean-s/all_documents/1095.", // To: w/assts <govt.>
"kean-s/attachments/2030.", // To: w/assts <govt.>
]);
let known_bad_from = HashSet::from([