#![feature(rustc_macro)] #[macro_use] extern crate serde_derive; extern crate serde_json; extern crate regex; extern crate yaml_rust; extern crate walkdir; use walkdir::{WalkDir, DirEntry}; use std::io::prelude::*; use std::fs::File; use std::env; use std::path::Path; use std::sync::{Arc, Mutex}; use std::thread; mod pre_process; mod section; mod character; use character::Character; mod tags; mod dl_list; mod tiles; static MAX_THREADS: u32 = 12; fn main() { let raw_files = env::var("RAW_FILES").unwrap_or("characters".into()); let out_files = env::var("OUT").unwrap_or("json".into()); let base_path = Path::new(&raw_files); let out_path = Path::new(&out_files); let files: Arc>> = Arc::new(Mutex::new(WalkDir::new(base_path).min_depth(1).into_iter().filter_map(|e| e.ok()).collect())); for 1..MAX_THREADS { std::thread(move || { let entry: Option = None; { entry = files.lock().unwrap().pop(); if entry.is_none() { println!("thread finished"); return; } } let entry = entry.unwrap(); let mut f = File::open(entry.path()).expect("could not open file"); let mut buf = String::new(); if let Err(_) = f.read_to_string(&mut buf) { println!("invalid file: {}", entry.path().to_str().unwrap()); continue; } let buf = pre_process::strip_irrelevant_content(&buf); let mut char = Character::new(); char.parse(&buf); let json = serde_json::to_string(&char).unwrap(); let out_file = out_path.join(entry.file_name().to_str().unwrap().replace("html", "json")); let mut o = File::create(&out_file).unwrap(); o.write_all(json.as_bytes()).unwrap(); println!("{:?}", out_file); }); } }