green_copper_runtime/modules/parsers/
mod.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
use csv::Trim;
use quickjs_runtime::builder::QuickJsRuntimeBuilder;
use quickjs_runtime::jsutils::jsproxies::JsProxy;
use quickjs_runtime::jsutils::modules::NativeModuleLoader;
use quickjs_runtime::jsutils::JsError;
use quickjs_runtime::quickjsrealmadapter::QuickJsRealmAdapter;
use quickjs_runtime::quickjsvalueadapter::QuickJsValueAdapter;
use quickjs_runtime::values::JsValueFacade;
use std::str;

/// Native module loader that serves the `greco://parsers` module.
///
/// The struct carries no state; it only exists to hang the
/// `NativeModuleLoader` implementation on.
struct ParsersModuleLoader {}

/// Exposes the `greco://parsers` native module and its single `CsvParser` export.
impl NativeModuleLoader for ParsersModuleLoader {
    /// Returns `true` only when `module_name` is exactly `greco://parsers`.
    fn has_module(&self, _realm: &QuickJsRealmAdapter, module_name: &str) -> bool {
        module_name == "greco://parsers"
    }

    /// Lists the export names of the module; the requested module name is not inspected.
    fn get_module_export_names(
        &self,
        _realm: &QuickJsRealmAdapter,
        _module_name: &str,
    ) -> Vec<&str> {
        Vec::from(["CsvParser"])
    }

    /// Builds the export values for `realm`.
    ///
    /// # Panics
    ///
    /// Panics when `init_exports` fails, because this trait method has no way
    /// to return an error to the caller.
    fn get_module_exports(
        &self,
        realm: &QuickJsRealmAdapter,
        _module_name: &str,
    ) -> Vec<(&str, QuickJsValueAdapter)> {
        let exports = init_exports(realm);
        exports.expect("init parsers exports failed")
    }
}

/// Registers the `greco://parsers` native module loader on `builder` and
/// returns the builder so further configuration can be chained.
pub(crate) fn init(builder: QuickJsRuntimeBuilder) -> QuickJsRuntimeBuilder {
    let loader = ParsersModuleLoader {};
    builder.native_module_loader(loader)
}

/// Installs the `CsvParser` proxy class in `realm` and returns the module's
/// exports as `(name, value)` pairs.
///
/// # Errors
///
/// Returns the `JsError` reported by `install_proxy` when the proxy class
/// cannot be installed.
fn init_exports(
    realm: &QuickJsRealmAdapter,
) -> Result<Vec<(&'static str, QuickJsValueAdapter)>, JsError> {
    // NOTE(review): the `false` flag presumably keeps the proxy from being
    // published as a global variable; confirm against `install_proxy`.
    let csv_parser = realm.install_proxy(create_csv_parser_proxy(realm), false)?;
    let exports = vec![("CsvParser", csv_parser)];

    Ok(exports)
}

pub(crate) fn create_csv_parser_proxy(_realm: &QuickJsRealmAdapter) -> JsProxy {
    JsProxy::new().namespace(&["greco", "parsers"]).name("CsvParser")
        .static_method("parse", |_runtime, realm,  args| {

            // three args, a string or Uint8array for data, a recordCallBack function and an optional options object

            if args.len() < 3 || !(args[0].is_string() || args[0].is_typed_array()) || !args[1].is_function() || !args[2].is_function() {
                Err(JsError::new_str("parse requires 2 or 3 args (data: string | Uint8Array, headersCallBack: (headers: array<string>) => void, recordCallback: (record: array<string>) => void, options: {})"))
            } else {

                // get data, func_ref as JsValueFacade, move to producer

                let data = if args[0].is_string() {
                    args[0].to_string()?
                } else {
                    let buf = realm.copy_typed_array_buffer(&args[0])?;
                    String::from_utf8(buf).map_err(|e| JsError::new_string(format!("{e}")))?
                };
                let cb_h_func = realm.to_js_value_facade(&args[1])?;
                let cb_r_func = realm.to_js_value_facade(&args[2])?;

                realm.create_resolving_promise_async(  async move {

                    let mut rdr = csv::ReaderBuilder::new()
                        .double_quote(true)
                        .delimiter(b',')
                        .has_headers(true)
                        .quoting(true)
                        .flexible(true)
                        //.ascii()
                        .trim(Trim::All)
                        .from_reader(data.as_bytes());

                    let cached_h_function = if let JsValueFacade::JsFunction { cached_function } = cb_h_func { cached_function } else { panic!("function was not a function") };
                    let cached_r_function = if let JsValueFacade::JsFunction { cached_function } = cb_r_func { cached_function } else { panic!("function was not a function") };

                    let headers = rdr.headers().map_err(|e| JsError::new_string(format!("{e}")))?;

                    log::trace!("greco::parsers::CsvParser headers: {:?}", headers);

                    let val: Vec<JsValueFacade> = headers.iter().map(|h| {
                        JsValueFacade::new_str(h)
                    }).collect();

                    let _ = cached_h_function.invoke_function( vec![JsValueFacade::Array {val}]).await;

                    for result in rdr.records() {
                        // The iterator yields Result<StringRecord, Error>, so we check the
                        // error here.
                        let record = result.map_err(|e| JsError::new_string(format!("{e}")))?;

                        // fill val from record
                        let val: Vec<JsValueFacade> = record.iter().map(|h| {
                            JsValueFacade::new_str(h)
                        }).collect();

                        let jsvf_record = JsValueFacade::Array {val};

                        let _ = cached_r_function.invoke_function( vec![jsvf_record]).await;

                        log::trace!("greco::parsers::CsvParser row: {:?}", record);
                    }


                    Ok(())
                }, |realm, _result| {
                    realm.create_null()
                })
            }


        })
}

#[cfg(test)]
pub mod tests {
    use futures::executor::block_on;
    use quickjs_runtime::builder::QuickJsRuntimeBuilder;
    use quickjs_runtime::jsutils::Script;
    use quickjs_runtime::values::JsValueFacade;

    /// Imports `greco://parsers` from a script, parses a small CSV document
    /// and checks that the header row and both records reached the callbacks.
    #[test]
    fn test_csv() {
        // Uncomment to see log output while debugging:
        //simple_logging::log_to_stderr(log::LevelFilter::Info);

        let builder = QuickJsRuntimeBuilder::new();
        let builder = crate::init_greco_rt(builder);
        let rt = builder.build();

        let script = Script::new(
            "test_parsers.js",
            r#"

        async function test() {
            let parsersMod = await import('greco://parsers');

            let data = '"r 1", "r2", "r3", "r4"\n"a", "b", 1, 2\n"c", "d", 3, 4';

            let ret = "";

            await parsersMod.CsvParser.parse(data, (headers) => {
                console.log("headers: " + headers.join("-"));
                ret += "headers: " + headers.join("-") + "\n";
            }, (row) => {
                console.log("row: " + row.join("-"));
                ret += "row: " + row.join("-") + "\n"

            });
            console.log("parser done");

            return ret;

        }

        test()

        "#,
        );
        // `expect` directly on the Result keeps the error detail in the panic message.
        let res: JsValueFacade = block_on(rt.eval(None, script)).expect("script failed");

        println!("{}", res.stringify());
        if let JsValueFacade::JsPromise { cached_promise } = res {
            let p_res =
                block_on(cached_promise.get_promise_result()).expect("get prom res failed");
            match p_res {
                Ok(jsvf) => {
                    let out = jsvf.stringify();
                    println!("prom resolved to {}", out);

                    // Only the first field of every line is asserted: it is the
                    // one that starts with a quote right at the field start.
                    assert!(
                        out.contains("headers: r 1-"),
                        "header row missing in: {}",
                        out
                    );
                    assert!(out.contains("row: a-"), "first record missing in: {}", out);
                    assert!(out.contains("row: c-"), "second record missing in: {}", out);
                }
                Err(e) => {
                    panic!("prom rejected: {}", e.stringify());
                }
            }
        } else {
            panic!("did not get a promise");
        }
    }
}