Add closest string

This commit is contained in:
hal8174 2024-11-21 22:48:34 +01:00
parent 5a3525a9ce
commit c3cfbcbada
14 changed files with 5399 additions and 0 deletions

237
closest_string/Cargo.lock generated Normal file
View file

@ -0,0 +1,237 @@
# This file is automatically @generated by Cargo.
# It is not intended for manual editing.
version = 3
[[package]]
name = "anstream"
version = "0.6.18"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "8acc5369981196006228e28809f761875c0327210a891e941f4c683b3a99529b"
dependencies = [
"anstyle",
"anstyle-parse",
"anstyle-query",
"anstyle-wincon",
"colorchoice",
"is_terminal_polyfill",
"utf8parse",
]
[[package]]
name = "anstyle"
version = "1.0.10"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "55cc3b69f167a1ef2e161439aa98aed94e6028e5f9a59be9a6ffb47aef1651f9"
[[package]]
name = "anstyle-parse"
version = "0.2.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "3b2d16507662817a6a20a9ea92df6652ee4f94f914589377d69f3b21bc5798a9"
dependencies = [
"utf8parse",
]
[[package]]
name = "anstyle-query"
version = "1.1.2"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "79947af37f4177cfead1110013d678905c37501914fba0efea834c3fe9a8d60c"
dependencies = [
"windows-sys",
]
[[package]]
name = "anstyle-wincon"
version = "3.0.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "2109dbce0e72be3ec00bed26e6a7479ca384ad226efdd66db8fa2e3a38c83125"
dependencies = [
"anstyle",
"windows-sys",
]
[[package]]
name = "clap"
version = "4.5.21"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "fb3b4b9e5a7c7514dfa52869339ee98b3156b0bfb4e8a77c4ff4babb64b1604f"
dependencies = [
"clap_builder",
"clap_derive",
]
[[package]]
name = "clap_builder"
version = "4.5.21"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "b17a95aa67cc7b5ebd32aa5370189aa0d79069ef1c64ce893bd30fb24bff20ec"
dependencies = [
"anstream",
"anstyle",
"clap_lex",
"strsim",
]
[[package]]
name = "clap_derive"
version = "4.5.18"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "4ac6a0c7b1a9e9a5186361f67dfa1b88213572f427fb9ab038efb2bd8c582dab"
dependencies = [
"heck",
"proc-macro2",
"quote",
"syn",
]
[[package]]
name = "clap_lex"
version = "0.7.3"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "afb84c814227b90d6895e01398aee0d8033c00e7466aca416fb6a8e0eb19d8a7"
[[package]]
name = "closest_string"
version = "0.1.0"
dependencies = [
"clap",
]
[[package]]
name = "colorchoice"
version = "1.0.3"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "5b63caa9aa9397e2d9480a9b13673856c78d8ac123288526c37d7839f2a86990"
[[package]]
name = "heck"
version = "0.5.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea"
[[package]]
name = "is_terminal_polyfill"
version = "1.70.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "7943c866cc5cd64cbc25b2e01621d07fa8eb2a1a23160ee81ce38704e97b8ecf"
[[package]]
name = "proc-macro2"
version = "1.0.91"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "307e3004becf10f5a6e0d59d20f3cd28231b0e0827a96cd3e0ce6d14bc1e4bb3"
dependencies = [
"unicode-ident",
]
[[package]]
name = "quote"
version = "1.0.37"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "b5b9d34b8991d19d98081b46eacdd8eb58c6f2b201139f7c5f643cc155a633af"
dependencies = [
"proc-macro2",
]
[[package]]
name = "strsim"
version = "0.11.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "7da8b5736845d9f2fcb837ea5d9e2628564b3b043a70948a3f0b778838c5fb4f"
[[package]]
name = "syn"
version = "2.0.89"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "44d46482f1c1c87acd84dea20c1bf5ebff4c757009ed6bf19cfd36fb10e92c4e"
dependencies = [
"proc-macro2",
"quote",
"unicode-ident",
]
[[package]]
name = "unicode-ident"
version = "1.0.14"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "adb9e6ca4f869e1180728b7950e35922a7fc6397f7b641499e8f3ef06e50dc83"
[[package]]
name = "utf8parse"
version = "0.2.2"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "06abde3611657adf66d383f00b093d7faecc7fa57071cce2578660c9f1010821"
[[package]]
name = "windows-sys"
version = "0.59.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "1e38bc4d79ed67fd075bcc251a1c39b32a1776bbe92e5bef1f0bf1f8c531853b"
dependencies = [
"windows-targets",
]
[[package]]
name = "windows-targets"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "9b724f72796e036ab90c1021d4780d4d3d648aca59e491e6b98e725b84e99973"
dependencies = [
"windows_aarch64_gnullvm",
"windows_aarch64_msvc",
"windows_i686_gnu",
"windows_i686_gnullvm",
"windows_i686_msvc",
"windows_x86_64_gnu",
"windows_x86_64_gnullvm",
"windows_x86_64_msvc",
]
[[package]]
name = "windows_aarch64_gnullvm"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "32a4622180e7a0ec044bb555404c800bc9fd9ec262ec147edd5989ccd0c02cd3"
[[package]]
name = "windows_aarch64_msvc"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "09ec2a7bb152e2252b53fa7803150007879548bc709c039df7627cabbd05d469"
[[package]]
name = "windows_i686_gnu"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "8e9b5ad5ab802e97eb8e295ac6720e509ee4c243f69d781394014ebfe8bbfa0b"
[[package]]
name = "windows_i686_gnullvm"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "0eee52d38c090b3caa76c563b86c3a4bd71ef1a819287c19d586d7334ae8ed66"
[[package]]
name = "windows_i686_msvc"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "240948bc05c5e7c6dabba28bf89d89ffce3e303022809e73deaefe4f6ec56c66"
[[package]]
name = "windows_x86_64_gnu"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "147a5c80aabfbf0c7d901cb5895d1de30ef2907eb21fbbab29ca94c5b08b1a78"
[[package]]
name = "windows_x86_64_gnullvm"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "24d5b23dc417412679681396f2b49f3de8c1473deb516bd34410872eff51ed0d"
[[package]]
name = "windows_x86_64_msvc"
version = "0.52.6"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "589f6da84c646204747d1270a2a5661ea66ed1cced2631d546fdfb155959f9ec"

View file

@ -0,0 +1,7 @@
[package]
name = "closest_string"
version = "0.1.0"
edition = "2021"
[dependencies]
clap = { version = "4.5.21", features = ["derive"] }

1
closest_string/cs0.out Normal file
View file

@ -0,0 +1 @@
dbadcabbcbaccbabadbb

1
closest_string/cs1.out Normal file
View file

@ -0,0 +1 @@
acdccadadcbadcdbdaaadacbcdcacbbdcdabbbbddbcbccdbabccccdbbacccdccccacaaddcabaaabbbadacbbddaccccbcccbb

1
closest_string/cs2.out Normal file
View file

@ -0,0 +1 @@
cdbdbdbababcdaacbabbdadccdbdcdaacdbaacccddcdbbacadcbcacddcddacdaddcbbacbbddcccdcdbcbacccbabbcbbbaaaa

1
closest_string/cs3.out Normal file
View file

@ -0,0 +1 @@
bcdcacdbbbcbbadbbbaabdadcaddcddabbdacddacaaccadcaabdcdddddadacbdcdcbccabbbabdddbacaddcaacaadacbacbdd

1
closest_string/cs4.out Normal file
View file

@ -0,0 +1 @@
bcdbdcdaabaacdbcddadbddcaabcabaadbbccdcbbdbbbccadcaabcbbcdbbcbbbbccacaabbdcdaccbaaaddccbcdcacdcbcacd

122
closest_string/src/main.rs Normal file
View file

@ -0,0 +1,122 @@
use std::path::{Path, PathBuf};
use clap::{Parser, ValueEnum};
/// Loads the instance stored in `filename`.
///
/// The first line of the file is skipped; every following line is returned as
/// its raw bytes, in file order.
///
/// # Panics
///
/// Panics if the file cannot be read as UTF-8 text.
fn read_input(filename: impl AsRef<Path>) -> Vec<Vec<u8>> {
    let contents = std::fs::read_to_string(filename).unwrap();
    contents
        .lines()
        .skip(1)
        .map(|row| row.as_bytes().to_vec())
        .collect()
}
/// Counts the positions at which `a` and `b` hold different bytes.
///
/// Only the common prefix is compared: when the slices differ in length the
/// surplus bytes of the longer one are ignored.
fn calculate_hamming_distance(a: &[u8], b: &[u8]) -> usize {
    let mut mismatches = 0;
    for (left, right) in a.iter().zip(b) {
        if left != right {
            mismatches += 1;
        }
    }
    mismatches
}
/// Bounded search tree for the closest-string problem.
///
/// Tries to turn `solution` into a string whose Hamming distance to every
/// entry of `strings` is at most `d`, changing one position per recursion
/// level.
///
/// * `strings`  - the input strings (assumed to share the length of
///   `solution`; only common prefixes are compared otherwise).
/// * `solution` - candidate buffer, edited in place. The top-level call is
///   expected to pass a copy of one of the input strings.
/// * `d`        - distance bound, which is also the total number of positions
///   that may be changed relative to the starting candidate.
/// * `depth`    - number of positions already changed; pass `0` at the top.
///
/// Returns `Some(solution)` with the buffer holding a valid answer, or `None`
/// if the search space is exhausted; in that case the buffer is restored to
/// the content it had on entry.
fn simple<'a>(
    strings: &[Vec<u8>],
    solution: &'a mut [u8],
    d: usize,
    depth: usize,
) -> Option<&'a [u8]> {
    // Find the input string that is currently furthest from the candidate.
    let farthest = strings
        .iter()
        .map(|s| (s, calculate_hamming_distance(s, solution)))
        .max_by_key(|(_, dist)| *dist);
    let Some((s, dist)) = farthest else {
        // Without any input string every candidate is trivially valid.
        return Some(solution);
    };
    if dist <= d {
        return Some(solution);
    }

    // `depth` changes are spent, so `d - depth` remain. Each change lowers the
    // distance to `s` by at most one, hence anything further away than
    // `d + remaining` can no longer be repaired.
    let remaining = d.checked_sub(depth)?;
    if dist > d.saturating_add(remaining) {
        return None;
    }

    // Any string within `d` of `s` must agree with `s` on at least one of any
    // `d + 1` mismatching positions, so branching on the first `d + 1` is
    // sufficient and keeps the search tree bounded.
    let positions: Vec<usize> = s
        .iter()
        .zip(solution.iter())
        .enumerate()
        .filter(|(_, (a, b))| a != b)
        .map(|(index, _)| index)
        .take(d.saturating_add(1))
        .collect();

    for index in positions {
        let previous = solution[index];
        solution[index] = s[index];
        if simple(strings, solution, d, depth + 1).is_some() {
            // Keep the successful modification in the buffer for the caller.
            return Some(solution);
        }
        // Dead end: undo the change before trying the next position.
        solution[index] = previous;
    }
    None
}
/// Runs the search strategy selected by `method` for distance bound `d`.
///
/// Returns the candidate buffer when the strategy reports success and `None`
/// otherwise.
///
/// # Panics
///
/// Panics if `strings` is empty, because the first string seeds the search.
fn closest_string(strings: &[Vec<u8>], d: usize, method: Method) -> Option<Vec<u8>> {
    match method {
        Method::Simple => {
            // Start from a copy of the first input string; `simple` works on
            // this buffer through a mutable borrow.
            let mut candidate = strings[0].clone();
            let found = simple(strings, &mut candidate, d, 0).is_some();
            found.then_some(candidate)
        }
    }
}
// Search strategies that can be chosen on the command line (the `ValueEnum`
// derive lets clap parse the variant from its name).
// Plain `//` comments are used here on purpose: clap's derive turns `///` doc
// comments into help text, which would change the program's CLI output.
#[derive(ValueEnum, Debug, Clone, Copy)]
enum Method {
// Dispatched by `closest_string` to the recursive `simple` search.
Simple,
}
// Command-line arguments; `main` obtains them through `Args::parse()`.
// Plain `//` comments are used so that clap's generated help stays unchanged.
#[derive(Debug, Parser)]
struct Args {
// Path of the instance file, handed to `read_input`.
filename: PathBuf,
// Distance bound to test. When omitted, `main` searches over several values
// of `d` instead of running a single query.
d: Option<usize>,
// Search strategy; the default value string is "simple".
#[clap(default_value = "simple")]
method: Method,
// Only consulted when `d` is omitted: selects the alternative search loop in
// `main` that starts from a large `d` rather than from 0.
#[clap(short, long)]
reverse: bool,
}
fn main() {
let total_start = std::time::Instant::now();
let args = Args::parse();
let strings = read_input(args.filename);
let result = if let Some(d) = args.d {
let start = std::time::Instant::now();
let r = closest_string(&strings, d, args.method);
eprintln!("{}: {:?}", d, start.elapsed());
r
} else if args.reverse {
let mut d = strings.len();
let mut last_solution = None;
loop {
let start = std::time::Instant::now();
let r = closest_string(&strings, d, args.method);
eprintln!("{}: {:?}", d, start.elapsed());
if let Some(r) = r {
d = r.len() - 1;
last_solution = Some(r);
} else {
break last_solution;
};
}
} else {
let mut d = 0;
loop {
let start = std::time::Instant::now();
let r = closest_string(&strings, d, args.method);
eprintln!("{}: {:?}", d, start.elapsed());
if let Some(r) = r {
break Some(r);
}
d += 1;
}
};
if let Some(solution) = result {
println!("{}", String::from_utf8(solution).unwrap());
}
eprintln!("Total time: {:?}", total_start.elapsed());
}

1001
closest_string/string0.in Normal file

File diff suppressed because it is too large Load diff

1001
closest_string/string1.in Normal file

File diff suppressed because it is too large Load diff

1001
closest_string/string2.in Normal file

File diff suppressed because it is too large Load diff

1001
closest_string/string3.in Normal file

File diff suppressed because it is too large Load diff

1001
closest_string/string4.in Normal file

File diff suppressed because it is too large Load diff

23
closest_string/validator.py Executable file
View file

@ -0,0 +1,23 @@
#!/usr/bin/env python
"""
usage: python3 validator.py path/to/input path/to/solution/output

Prints the largest Hamming distance between the proposed solution string and
the strings of the input file.
"""
import sys

# Context managers make sure both files are closed, even if parsing fails.
with open(sys.argv[1], "r") as input_file, open(sys.argv[2], "r") as sol_file:
    # The header is parsed so that a malformed file fails loudly; the value
    # itself is not needed afterwards.
    n = int(input_file.readline().strip())
    # NOTE(review): `[1:]` skips one more line after the header. Confirm that
    # the input format really has a second non-string line here.
    strings = [l.strip() for l in input_file.readlines()[1:]]
    s = sol_file.readline().strip()

if not strings:
    print("Input contains no strings")
    sys.exit()

if len(s) != len(strings[0]):
    print("Lengths of strings do not match")
    sys.exit()

# Hamming distance to every input string; the worst one is reported.
dist = max(sum(c1 != c2 for c1, c2 in zip(s, string)) for string in strings)
print("String has max distance {}".format(dist))