1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
use std::sync::Arc;

use arrow::{
    array::Array,
    datatypes::{Field, Schema},
    error::ArrowError,
    record_batch::RecordBatch,
};
use brontes_types::mev::Sandwich;
use itertools::Itertools;

use crate::parquet::{
    normalized_actions::{
        gas_details::{get_gas_details_array, get_gas_details_list_array},
        swaps::get_normalized_swap_list_array,
    },
    utils::{get_list_string_array_from_owned, get_string_array_from_owned},
};

pub fn sandwich_to_record_batch(sandwiches: Vec<Sandwich>) -> Result<RecordBatch, ArrowError> {
    let frontrun_tx_hash_array = get_list_string_array_from_owned(
        sandwiches
            .iter()
            .map(|s| {
                s.frontrun_tx_hash
                    .iter()
                    .map(|hash| hash.to_string())
                    .collect_vec()
            })
            .collect_vec(),
    );

    let frontrun_swaps_array = get_normalized_swap_list_array(
        sandwiches
            .iter()
            .map(|s| s.frontrun_swaps.iter().flatten().collect_vec())
            .collect_vec(),
    );

    let frontrun_gas_details_array = get_gas_details_list_array(
        sandwiches
            .iter()
            .map(|s| &s.frontrun_gas_details)
            .collect_vec(),
    );

    let victim_swaps_tx_hashes_array = get_list_string_array_from_owned(
        sandwiches
            .iter()
            .map(|s| {
                s.victim_swaps_tx_hashes
                    .iter()
                    .flatten()
                    .map(|hash| hash.to_string())
                    .collect_vec()
            })
            .collect_vec(),
    );
    let victim_swaps_array = get_normalized_swap_list_array(
        sandwiches
            .iter()
            .map(|s| s.victim_swaps.iter().flatten().collect_vec())
            .collect_vec(),
    );

    let victim_swaps_gas_details_array = get_gas_details_list_array(
        sandwiches
            .iter()
            .map(|s| &s.victim_swaps_gas_details)
            .collect_vec(),
    );

    let backrun_tx_hash_array = get_string_array_from_owned(
        sandwiches
            .iter()
            .map(|s| Some(s.backrun_tx_hash.to_string()))
            .collect_vec(),
    );

    let backrun_swaps_array = get_normalized_swap_list_array(
        sandwiches
            .iter()
            .map(|s| s.backrun_swaps.iter().collect_vec())
            .collect_vec(),
    );

    let backrun_gas_details_array =
        get_gas_details_array(sandwiches.iter().map(|s| s.backrun_gas_details).collect());

    let schema = Schema::new(vec![
        Field::new("frontrun_tx_hash", frontrun_tx_hash_array.data_type().clone(), false),
        Field::new("frontrun_swaps", frontrun_swaps_array.data_type().clone(), false),
        Field::new("frontrun_gas_details", frontrun_gas_details_array.data_type().clone(), false),
        Field::new(
            "victim_swaps_tx_hashes",
            victim_swaps_tx_hashes_array.data_type().clone(),
            false,
        ),
        Field::new("victim_swaps", victim_swaps_array.data_type().clone(), false),
        Field::new(
            "victim_swaps_gas_details",
            victim_swaps_gas_details_array.data_type().clone(),
            false,
        ),
        Field::new("backrun_tx_hash", backrun_tx_hash_array.data_type().clone(), false),
        Field::new("backrun_swaps", backrun_swaps_array.data_type().clone(), false),
        Field::new("backrun_gas_details", backrun_gas_details_array.data_type().clone(), false),
    ]);

    RecordBatch::try_new(
        Arc::new(schema),
        vec![
            Arc::new(frontrun_tx_hash_array),
            Arc::new(frontrun_swaps_array),
            Arc::new(frontrun_gas_details_array),
            Arc::new(victim_swaps_tx_hashes_array),
            Arc::new(victim_swaps_array),
            Arc::new(victim_swaps_gas_details_array),
            Arc::new(backrun_tx_hash_array),
            Arc::new(backrun_swaps_array),
            Arc::new(backrun_gas_details_array),
        ],
    )
}