about summary refs log tree commit diff stats
path: root/src/storage/video_database/extractor_hash.rs
blob: c956919aacd72f8d178a04c6d33448677d7dbe9c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
// yt - A fully featured command line YouTube client
//
// Copyright (C) 2024 Benedikt Peetz <benedikt.peetz@b-peetz.de>
// SPDX-License-Identifier: GPL-3.0-or-later
//
// This file is part of Yt.
//
// You should have received a copy of the License along with this program.
// If not, see <https://www.gnu.org/licenses/gpl-3.0.txt>.

use std::{collections::HashMap, fmt::Display, str::FromStr};

use anyhow::{bail, Context, Result};
use blake3::Hash;
use log::debug;
use tokio::sync::OnceCell;

use crate::{app::App, storage::video_database::getters::get_all_hashes};

/// Cached number of leading hex characters used when shortening a hash.
///
/// Starts out empty; [`ExtractorHash::into_short_hash`] stores the computed length here on its
/// first successful call so that later calls can reuse it instead of recomputing it.
static EXTRACTOR_HASH_LENGTH: OnceCell<usize> = OnceCell::const_new();

/// A complete hash, stored as a [`blake3::Hash`].
///
/// Displaying it delegates to the formatting of the wrapped hash. A shortened textual form can
/// be obtained through [`ExtractorHash::into_short_hash`].
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct ExtractorHash {
    /// The wrapped full-length hash.
    hash: Hash,
}

impl Display for ExtractorHash {
    /// Write the hash exactly the way the wrapped [`Hash`] displays itself.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let Self { hash } = self;
        // Name the trait explicitly so it is obvious that the `Display` (not `Debug`)
        // representation of the inner hash is forwarded.
        Display::fmt(hash, f)
    }
}

/// A hash in shortened textual form.
///
/// The wrapped string is either the leading characters of a full hash's hexadecimal
/// representation (see [`ExtractorHash::into_short_hash`]) or text that was parsed into a
/// [`LazyExtractorHash`].
#[derive(Debug, Clone)]
pub struct ShortHash(String);

impl Display for ShortHash {
    /// Write the wrapped text, honouring the formatter's width/precision flags just like a
    /// plain `String` would.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let Self(text) = self;
        Display::fmt(text, f)
    }
}

/// A hash given in (possibly shortened) textual form that has not been looked up yet.
///
/// Parsing via [`FromStr`] performs only cheap validation and stores the text;
/// [`LazyExtractorHash::realize`] later resolves it to an [`ExtractorHash`].
#[derive(Debug, Clone)]
pub struct LazyExtractorHash {
    /// The text as it was supplied to `from_str`.
    value: ShortHash,
}

impl FromStr for LazyExtractorHash {
    type Err = anyhow::Error;

    /// Parse a (possibly shortened) hash from its textual form.
    ///
    /// Only cheap, database-free validation happens here; whether the text actually
    /// abbreviates a stored hash is decided later by [`LazyExtractorHash::realize`].
    ///
    /// # Errors
    /// Returns an error if `s` is empty, longer than 64 bytes, or contains a character that
    /// is not a hexadecimal digit.
    fn from_str(s: &str) -> std::result::Result<Self, Self::Err> {
        // An empty prefix is a prefix of *every* hash, so it would silently resolve to an
        // arbitrary entry later on. Refuse it here instead.
        if s.is_empty() {
            bail!("A hash must contain at least one character!");
        }

        if s.len() > 64 {
            bail!("A hash can only contain 64 bytes!");
        }

        // Short hashes are prefixes of a hexadecimal string, so any other character can never
        // match. Reporting it now gives a far clearer error than a failed lookup would.
        if let Some(invalid) = s.chars().find(|ch| !ch.is_ascii_hexdigit()) {
            bail!(
                "A hash can only contain hexadecimal digits, but found '{}'!",
                invalid
            );
        }

        Ok(Self {
            value: ShortHash(s.to_owned()),
        })
    }
}

impl LazyExtractorHash {
    /// Resolve this lazily stored hash text into a full [`ExtractorHash`].
    ///
    /// Consumes `self` and forwards the stored short hash to
    /// [`ExtractorHash::from_short_hash`]; any error from that lookup is returned unchanged.
    pub async fn realize(self, app: &App) -> Result<ExtractorHash> {
        let Self { value: short_hash } = self;
        ExtractorHash::from_short_hash(app, &short_hash).await
    }
}

impl ExtractorHash {
    /// Number of characters in the hexadecimal text form of a [`Hash`], and therefore the
    /// longest prefix a [`ShortHash`] can ever need.
    const HEX_LENGTH: usize = 64;

    /// Wrap an already computed [`Hash`].
    pub fn from_hash(hash: Hash) -> Self {
        Self { hash }
    }

    /// Resolve a [`ShortHash`] to the full hash it abbreviates.
    ///
    /// # Errors
    /// Fails if the stored hashes cannot be fetched, or if none of them starts with `s`.
    pub async fn from_short_hash(app: &App, s: &ShortHash) -> Result<Self> {
        let hash = Self::short_hash_to_full_hash(app, s).await?;
        Ok(Self { hash })
    }

    /// Borrow the wrapped [`Hash`].
    pub fn hash(&self) -> &Hash {
        &self.hash
    }

    /// Produce the shortened textual form of this hash.
    ///
    /// The number of characters to keep is computed on the first successful call (from all
    /// hashes returned by `get_all_hashes`) and then cached in `EXTRACTOR_HASH_LENGTH`, so
    /// every later call reuses the same length.
    ///
    /// # Errors
    /// Fails if the needed length has not been cached yet and computing it fails.
    pub async fn into_short_hash(&self, app: &App) -> Result<ShortHash> {
        // `get_or_try_init` lets exactly one caller run the initialiser while concurrent
        // callers wait for its result. A manual `get()` + `set()` pair would panic in the
        // second task whenever two of them raced through the "not yet initialised" branch.
        let needed_chars = *EXTRACTOR_HASH_LENGTH
            .get_or_try_init(|| async {
                self.get_needed_char_len(app)
                    .await
                    .context("Failed to calculate needed char length")
            })
            .await?;

        Ok(ShortHash(
            self.hash().to_hex().chars().take(needed_chars).collect(),
        ))
    }

    /// Find the first stored hash whose hexadecimal form starts with `s`.
    ///
    /// # Errors
    /// Fails if the stored hashes cannot be fetched, or if no hash starts with `s`.
    async fn short_hash_to_full_hash(app: &App, s: &ShortHash) -> Result<Hash> {
        let all_hashes = get_all_hashes(app)
            .await
            .context("Failed to fetch all extractor -hashesh from database")?;

        // `starts_with` simply yields `false` for an over-long prefix, whereas slicing the hex
        // string by the prefix length would panic.
        let prefix = s.0.as_str();
        let matching_hash = all_hashes
            .into_iter()
            .find(|hash| hash.to_hex().starts_with(prefix));

        match matching_hash {
            Some(hash) => Ok(hash),
            None => {
                bail!("Your shortend hash, does not match a real hash (this is probably a bug)!")
            }
        }
    }

    /// Compute how many leading hex characters are needed to tell all stored hashes apart.
    ///
    /// Returns `1` when there are no hashes or only a single one.
    ///
    /// # Errors
    /// Fails if the stored hashes cannot be fetched, or if two of them are identical over their
    /// whole length (in which case no prefix can distinguish them).
    async fn get_needed_char_len(&self, app: &App) -> Result<usize> {
        debug!("Calculating the needed hash char length");
        let all_hashes = get_all_hashes(app)
            .await
            .context("Failed to fetch all extractor -hashesh from database")?;

        let hex_hashes: Vec<String> = all_hashes
            .into_iter()
            .map(|hash| hash.to_hex().to_string())
            .collect();

        match Self::shortest_unique_prefix_len(&hex_hashes) {
            Some(needed_chars) => Ok(needed_chars),
            None => bail!(
                "Failed to find a unique hash prefix: the database contains duplicated hashes"
            ),
        }
    }

    /// Return the smallest prefix length (between 1 and [`Self::HEX_LENGTH`], both inclusive)
    /// at which all of `hex_hashes` differ, or `None` if they collide even at full length.
    fn shortest_unique_prefix_len(hex_hashes: &[String]) -> Option<usize> {
        (1..=Self::HEX_LENGTH).find(|&len| {
            // Used purely as a set of already seen prefixes; `HashMap` is the collection this
            // file already has in scope. Borrowed `&str` keys avoid one allocation per hash.
            let mut seen: HashMap<&str, ()> = HashMap::with_capacity(hex_hashes.len());

            hex_hashes.iter().all(|hex| {
                // Fall back to the whole string should it ever be shorter than `len`.
                let prefix = hex.get(..len).unwrap_or(hex.as_str());
                seen.insert(prefix, ()).is_none()
            })
        })
    }
}