sudachi/dic/
storage.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
/*
 *  Copyright (c) 2021-2024 Works Applications Co., Ltd.
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *   Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */

use memmap2::Mmap;
use nom::AsBytes;

pub enum Storage {
    File(Mmap),
    Borrowed(&'static [u8]),
    Owned(Vec<u8>),
}

impl AsRef<[u8]> for Storage {
    fn as_ref(&self) -> &[u8] {
        match self {
            Storage::File(m) => m.as_bytes(),
            Storage::Borrowed(b) => b,
            Storage::Owned(v) => v,
        }
    }
}

pub struct SudachiDicData {
    // system dictionary
    system: Storage,
    // user dictionaries
    user: Vec<Storage>,
}

impl SudachiDicData {
    pub fn new(system: Storage) -> Self {
        Self {
            system,
            user: Vec::new(),
        }
    }

    pub fn add_user(&mut self, user: Storage) {
        self.user.push(user)
    }

    pub fn system(&self) -> &[u8] {
        self.system.as_ref()
    }

    /// # Safety
    /// Call this function only after system dictionary data is ready.
    pub unsafe fn system_static_slice(&self) -> &'static [u8] {
        std::mem::transmute(self.system())
    }

    pub(crate) fn user_static_slice(&self) -> Vec<&'static [u8]> {
        let mut result = Vec::with_capacity(self.user.len());
        for u in self.user.iter() {
            let slice: &'static [u8] = unsafe { std::mem::transmute(u.as_ref()) };
            result.push(slice);
        }
        result
    }
}