Refactor code structure and improve performance by optimizing OpenCL kernel and adding timing macros; update Cargo.toml for release profile settings; enhance main.rs and sinks.rs for better readability and organization.

This commit is contained in:
2025-04-11 16:04:10 +02:00
parent c554b1f164
commit b04c01e737
11 changed files with 395 additions and 184 deletions

View File

@ -15,4 +15,4 @@ opt-level = "z"
codegen-units = 1 codegen-units = 1
[profile.release] [profile.release]
lto = true debug = true

View File

@ -15,35 +15,35 @@
* along with this program. If not, see <https://www.gnu.org/licenses/>. * along with this program. If not, see <https://www.gnu.org/licenses/>.
*/ */
mod types;
mod json_output; mod json_output;
mod sinks; mod sinks;
mod stderr; mod stderr;
mod types;
use std::fmt::Debug; use crate::sinks::{OutputFormat, OutputSink};
use std::io::Write; use crate::stderr::MaschineStdErr;
use clap::{command, Arg, ArgAction, ValueHint}; #[cfg(feature = "sql")]
use std::path::PathBuf; use crate::types::SqlSchematicSupplier;
use std::str::FromStr;
use clap::error::ErrorKind;
use crate::types::{PathSchematicSupplier, SchematicSupplier, SchematicSupplierType}; use crate::types::{PathSchematicSupplier, SchematicSupplier, SchematicSupplierType};
use clap::error::ErrorKind;
use clap::{command, Arg, ArgAction, ValueHint};
#[cfg(feature = "sql")] #[cfg(feature = "sql")]
use futures::executor::block_on; use futures::executor::block_on;
use indicatif::*;
use rayon::prelude::*; use rayon::prelude::*;
use rayon::ThreadPoolBuilder; use rayon::ThreadPoolBuilder;
use schemsearch_common::{Match, SearchBehavior};
use schemsearch_files::SpongeSchematic;
use schemsearch_lib::nbt_search::has_invalid_nbt;
use schemsearch_lib::search::search;
#[cfg(feature = "sql")] #[cfg(feature = "sql")]
use schemsearch_sql::filter::SchematicFilter; use schemsearch_sql::filter::SchematicFilter;
#[cfg(feature = "sql")] #[cfg(feature = "sql")]
use schemsearch_sql::load_all_schematics; use schemsearch_sql::load_all_schematics;
#[cfg(feature = "sql")] use std::fmt::Debug;
use crate::types::SqlSchematicSupplier; use std::io::Write;
use indicatif::*; use std::path::PathBuf;
use schemsearch_common::{Match, SearchBehavior}; use std::str::FromStr;
use schemsearch_files::SpongeSchematic;
use crate::sinks::{OutputFormat, OutputSink};
use crate::stderr::MaschineStdErr;
use schemsearch_lib::nbt_search::has_invalid_nbt;
use schemsearch_lib::search::search;
fn main() { fn main() {
#[allow(unused_mut)] #[allow(unused_mut)]
@ -219,7 +219,9 @@ fn main() {
ignore_air: matches.get_flag("ignore-air"), ignore_air: matches.get_flag("ignore-air"),
air_as_any: matches.get_flag("air-as-any"), air_as_any: matches.get_flag("air-as-any"),
ignore_entities: matches.get_flag("ignore-entities"), ignore_entities: matches.get_flag("ignore-entities"),
threshold: *matches.get_one::<f32>("threshold").expect("Couldn't get threshold"), threshold: *matches
.get_one::<f32>("threshold")
.expect("Couldn't get threshold"),
invalid_nbt: matches.get_flag("invalid-nbt"), invalid_nbt: matches.get_flag("invalid-nbt"),
opencl: matches.get_flag("opencl"), opencl: matches.get_flag("opencl"),
}; };
@ -228,7 +230,11 @@ fn main() {
Some(p) => match SpongeSchematic::load(&PathBuf::from(p)) { Some(p) => match SpongeSchematic::load(&PathBuf::from(p)) {
Ok(x) => Some(x), Ok(x) => Some(x),
Err(e) => { Err(e) => {
cmd.error(ErrorKind::Io, format!("Error while loading Pattern: {}", e.to_string())).exit(); cmd.error(
ErrorKind::Io,
format!("Error while loading Pattern: {}", e.to_string()),
)
.exit();
} }
}, },
None => None, None => None,
@ -269,60 +275,103 @@ fn main() {
} }
for schem in block_on(load_all_schematics(filter)) { for schem in block_on(load_all_schematics(filter)) {
schematics.push(SchematicSupplierType::SQL(SqlSchematicSupplier { schematics.push(SchematicSupplierType::SQL(SqlSchematicSupplier {
node: schem node: schem,
})) }))
}; }
} }
if schematics.is_empty() { if schematics.is_empty() {
cmd.error(ErrorKind::MissingRequiredArgument, "No schematics specified").exit(); cmd.error(
ErrorKind::MissingRequiredArgument,
"No schematics specified",
)
.exit();
} }
let output: Vec<&(OutputFormat, OutputSink)> = matches.get_many::<(OutputFormat, OutputSink)>("output").expect("Error").collect(); let output: Vec<&(OutputFormat, OutputSink)> = matches
let mut output: Vec<(OutputFormat, Box<dyn Write>)> = output.into_iter().map(|x| (x.0.clone(), x.1.output())).collect(); .get_many::<(OutputFormat, OutputSink)>("output")
.expect("Error")
.collect();
let mut output: Vec<(OutputFormat, Box<dyn Write>)> = output
.into_iter()
.map(|x| (x.0.clone(), x.1.output()))
.collect();
for x in &mut output { for x in &mut output {
write!(x.1, "{}", x.0.start(schematics.len() as u32, &search_behavior, start.elapsed().as_millis())).unwrap(); write!(
x.1,
"{}",
x.0.start(
schematics.len() as u32,
&search_behavior,
start.elapsed().as_millis()
)
)
.unwrap();
} }
ThreadPoolBuilder::new().num_threads(*matches.get_one::<usize>("threads").expect("Could not get threads")).build_global().unwrap(); ThreadPoolBuilder::new()
.num_threads(
*matches
.get_one::<usize>("threads")
.expect("Could not get threads"),
)
.build_global()
.unwrap();
let bar = ProgressBar::new(schematics.len() as u64); // "maschine" let bar = ProgressBar::new(schematics.len() as u64); // "maschine"
bar.set_style(ProgressStyle::with_template("[{elapsed}, ETA: {eta}] {wide_bar} {pos}/{len} {per_sec}").unwrap()); bar.set_style(
let term_size = *matches.get_one::<u16>("machine").expect("Could not get machine"); ProgressStyle::with_template("[{elapsed}, ETA: {eta}] {wide_bar} {pos}/{len} {per_sec}")
.unwrap(),
);
let term_size = *matches
.get_one::<u16>("machine")
.expect("Could not get machine");
if term_size != 0 { if term_size != 0 {
bar.set_draw_target(ProgressDrawTarget::term_like(Box::new(MaschineStdErr { size: term_size }))) bar.set_draw_target(ProgressDrawTarget::term_like(Box::new(MaschineStdErr {
size: term_size,
})))
} }
let max_matching = *matches.get_one::<usize>("limit").expect("Could not get max-matching"); let max_matching = *matches
.get_one::<usize>("limit")
.expect("Could not get max-matching");
let matches: Vec<SearchResult> = schematics.par_iter().progress_with(bar).map(|schem| { let matches: Vec<SearchResult> = schematics
match schem { .par_iter()
.progress_with(bar)
.map(|schem| match schem {
SchematicSupplierType::PATH(schem) => { SchematicSupplierType::PATH(schem) => {
let schematic = match load_schem(&schem.path) { let schematic = match load_schem(&schem.path) {
Some(x) => x, Some(x) => x,
None => return SearchResult { None => {
return SearchResult {
name: schem.get_name(), name: schem.get_name(),
matches: Vec::default(), matches: Vec::default(),
} }
}
}; };
search_in_schem(schematic, pattern.as_ref(), search_behavior, schem) search_in_schem(schematic, pattern.as_ref(), search_behavior, schem)
} }
#[cfg(feature = "sql")] #[cfg(feature = "sql")]
SchematicSupplierType::SQL(schem) => { SchematicSupplierType::SQL(schem) => match schem.get_schematic() {
match schem.get_schematic() { Ok(schematic) => {
Ok(schematic) => search_in_schem(schematic, pattern.as_ref(), search_behavior, schem), search_in_schem(schematic, pattern.as_ref(), search_behavior, schem)
}
Err(e) => { Err(e) => {
eprintln!("Error while loading schematic ({}): {}", schem.get_name(), e.to_string()); eprintln!(
"Error while loading schematic ({}): {}",
schem.get_name(),
e.to_string()
);
SearchResult { SearchResult {
name: schem.get_name(), name: schem.get_name(),
matches: Vec::default(), matches: Vec::default(),
} }
} }
} },
} })
} .collect();
}).collect();
let mut matches_count = 0; let mut matches_count = 0;
@ -340,14 +389,18 @@ fn main() {
} }
} }
let end = std::time::Instant::now();
for x in &mut output { for x in &mut output {
write!(x.1, "{}", x.0.end(end.duration_since(start).as_millis())).unwrap(); write!(x.1, "{}", x.0.end(start.elapsed())).unwrap();
x.1.flush().unwrap(); x.1.flush().unwrap();
} }
} }
fn search_in_schem(schematic: SpongeSchematic, pattern: Option<&SpongeSchematic>, search_behavior: SearchBehavior, schem: &impl SchematicSupplier) -> SearchResult { fn search_in_schem(
schematic: SpongeSchematic,
pattern: Option<&SpongeSchematic>,
search_behavior: SearchBehavior,
schem: &impl SchematicSupplier,
) -> SearchResult {
if search_behavior.invalid_nbt { if search_behavior.invalid_nbt {
if has_invalid_nbt(schematic) { if has_invalid_nbt(schematic) {
SearchResult { SearchResult {
@ -377,7 +430,11 @@ fn load_schem(schem_path: &PathBuf) -> Option<SpongeSchematic> {
match SpongeSchematic::load(schem_path) { match SpongeSchematic::load(schem_path) {
Ok(x) => Some(x), Ok(x) => Some(x),
Err(e) => { Err(e) => {
println!("Error while loading schematic ({}): {}", schem_path.to_str().unwrap(), e.to_string()); println!(
"Error while loading schematic ({}): {}",
schem_path.to_str().unwrap(),
e.to_string()
);
None None
} }
} }
@ -388,4 +445,3 @@ struct SearchResult {
name: String, name: String,
matches: Vec<Match>, matches: Vec<Match>,
} }

View File

@ -1,11 +1,11 @@
use std::fs::File; use crate::json_output::{EndEvent, FoundEvent, InitEvent, JsonEvent};
use std::io::BufWriter;
use std::str::FromStr;
use std::io::Write;
use std::time::Duration;
use indicatif::HumanDuration; use indicatif::HumanDuration;
use schemsearch_common::{Match, SearchBehavior}; use schemsearch_common::{Match, SearchBehavior};
use crate::json_output::{EndEvent, FoundEvent, InitEvent, JsonEvent}; use std::fs::File;
use std::io::BufWriter;
use std::io::Write;
use std::str::FromStr;
use std::time::Duration;
#[derive(Debug, Clone)] #[derive(Debug, Clone)]
pub enum OutputSink { pub enum OutputSink {
@ -18,7 +18,7 @@ pub enum OutputSink {
pub enum OutputFormat { pub enum OutputFormat {
Text, Text,
CSV, CSV,
JSON JSON,
} }
impl FromStr for OutputFormat { impl FromStr for OutputFormat {
@ -29,7 +29,7 @@ impl FromStr for OutputFormat {
"text" => Ok(OutputFormat::Text), "text" => Ok(OutputFormat::Text),
"csv" => Ok(OutputFormat::CSV), "csv" => Ok(OutputFormat::CSV),
"json" => Ok(OutputFormat::JSON), "json" => Ok(OutputFormat::JSON),
_ => Err(format!("'{}' is not a valid output format", s)) _ => Err(format!("'{}' is not a valid output format", s)),
} }
} }
} }
@ -41,7 +41,7 @@ impl FromStr for OutputSink {
match s { match s {
"std" => Ok(OutputSink::Stdout), "std" => Ok(OutputSink::Stdout),
"err" => Ok(OutputSink::Stderr), "err" => Ok(OutputSink::Stderr),
_ => Ok(OutputSink::File(s.to_string())) _ => Ok(OutputSink::File(s.to_string())),
} }
} }
} }
@ -51,7 +51,7 @@ impl OutputSink {
match self { match self {
OutputSink::Stdout => Box::new(std::io::stdout()), OutputSink::Stdout => Box::new(std::io::stdout()),
OutputSink::Stderr => Box::new(std::io::stderr()), OutputSink::Stderr => Box::new(std::io::stderr()),
OutputSink::File(path) => Box::new(BufWriter::new(File::create(path).unwrap())) OutputSink::File(path) => Box::new(BufWriter::new(File::create(path).unwrap())),
} }
} }
} }
@ -59,12 +59,21 @@ impl OutputSink {
impl OutputFormat { impl OutputFormat {
pub fn found_match(&self, name: &String, pos: Match) -> String { pub fn found_match(&self, name: &String, pos: Match) -> String {
match self { match self {
OutputFormat::Text => format!("Found match in '{}' at x: {}, y: {}, z: {}, % = {}\n", name, pos.x, pos.y, pos.z, pos.percent), OutputFormat::Text => format!(
OutputFormat::CSV => format!("{},{},{},{},{}\n", name, pos.x, pos.y, pos.z, pos.percent), "Found match in '{}' at x: {}, y: {}, z: {}, % = {}\n",
OutputFormat::JSON => format!("{}\n", serde_json::to_string(&JsonEvent::Found(FoundEvent { name, pos.x, pos.y, pos.z, pos.percent
),
OutputFormat::CSV => {
format!("{},{},{},{},{}\n", name, pos.x, pos.y, pos.z, pos.percent)
}
OutputFormat::JSON => format!(
"{}\n",
serde_json::to_string(&JsonEvent::Found(FoundEvent {
name: name.clone(), name: name.clone(),
match_: pos, match_: pos,
})).unwrap()) }))
.unwrap()
),
} }
} }
@ -72,19 +81,29 @@ impl OutputFormat {
match self { match self {
OutputFormat::Text => format!("Starting search in {} schematics\n", total), OutputFormat::Text => format!("Starting search in {} schematics\n", total),
OutputFormat::CSV => "Name,X,Y,Z,Percent\n".to_owned(), OutputFormat::CSV => "Name,X,Y,Z,Percent\n".to_owned(),
OutputFormat::JSON => format!("{}\n", serde_json::to_string(&JsonEvent::Init(InitEvent { OutputFormat::JSON => format!(
"{}\n",
serde_json::to_string(&JsonEvent::Init(InitEvent {
total, total,
search_behavior: search_behavior.clone(), search_behavior: search_behavior.clone(),
start_time, start_time,
})).unwrap()) }))
.unwrap()
),
} }
} }
pub fn end(&self, end_time: u128) -> String { pub fn end(&self, end_time: Duration) -> String {
match self { match self {
OutputFormat::Text => format!("Search complete in {}\n", HumanDuration(Duration::from_millis(end_time as u64))), OutputFormat::Text => format!("Search complete in {:?}\n", end_time),
OutputFormat::CSV => format!("{}\n", end_time), OutputFormat::CSV => format!("{:?}\n", end_time),
OutputFormat::JSON => format!("{}\n", serde_json::to_string(&JsonEvent::End(EndEvent{ end_time })).unwrap()) OutputFormat::JSON => format!(
"{}\n",
serde_json::to_string(&JsonEvent::End(EndEvent {
end_time: end_time.as_millis()
}))
.unwrap()
),
} }
} }
} }

View File

@ -34,3 +34,14 @@ pub struct Match {
pub z: u16, pub z: u16,
pub percent: f32, pub percent: f32,
} }
/// Evaluates a block, reports how long it took, and yields the block's value.
///
/// `time!(label, { ... })` expands to an expression, so it can be used anywhere
/// the wrapped block could be, e.g. `let x = time!(load, { load() })?;`.
///
/// * `$name` - an identifier used only as the label in the report line.
/// * `$body` - the block to measure; its value becomes the value of the macro.
///
/// The report line `"<label> took <duration>"` is written to standard error so
/// that it does not mix into results a program writes to standard output.
///
/// The block is expanded inline: a `?` or `return` inside `$body` leaves the
/// enclosing function immediately, and no report line is printed in that case.
#[macro_export]
macro_rules! time {
    ($name:ident, $body:block) => {{
        // Absolute paths keep the expansion independent of what the call site has in scope.
        let start = ::std::time::Instant::now();
        let result = $body;
        let duration = start.elapsed();
        // Diagnostics go to stderr; stdout is reserved for program output.
        eprintln!("{} took {:?}", stringify!($name), duration);
        result
    }};
}

8
schemsearch-lib/src/.idea/modules.xml generated Normal file
View File

@ -0,0 +1,8 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="ProjectModuleManager">
<modules>
<module fileurl="file://$PROJECT_DIR$/.idea/src.iml" filepath="$PROJECT_DIR$/.idea/src.iml" />
</modules>
</component>
</project>

8
schemsearch-lib/src/.idea/src.iml generated Normal file
View File

@ -0,0 +1,8 @@
<?xml version="1.0" encoding="UTF-8"?>
<module type="CPP_MODULE" version="4">
<component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$" />
<orderEntry type="inheritedJdk" />
<orderEntry type="sourceFolder" forTests="false" />
</component>
</module>

6
schemsearch-lib/src/.idea/vcs.xml generated Normal file
View File

@ -0,0 +1,6 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="VcsDirectoryMappings">
<mapping directory="$PROJECT_DIR$/../.." vcs="Git" />
</component>
</project>

63
schemsearch-lib/src/.idea/workspace.xml generated Normal file
View File

@ -0,0 +1,63 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="CMakeSettings">
<configurations>
<configuration PROFILE_NAME="Debug" ENABLED="true" CONFIG_NAME="Debug" />
</configurations>
</component>
<component name="ChangeListManager">
<list default="true" id="352451bc-b368-403e-b1be-bfdcb573471f" name="Changes" comment="">
<change afterPath="$PROJECT_DIR$/../../schemsearch-py/Cargo.toml" afterDir="false" />
<change afterPath="$PROJECT_DIR$/../../schemsearch-py/pyproject.toml" afterDir="false" />
<change afterPath="$PROJECT_DIR$/../../schemsearch-py/src/lib.rs" afterDir="false" />
<change beforePath="$PROJECT_DIR$/../../Cargo.toml" beforeDir="false" afterPath="$PROJECT_DIR$/../../Cargo.toml" afterDir="false" />
<change beforePath="$PROJECT_DIR$/../../SchemSearch.java" beforeDir="false" afterPath="$PROJECT_DIR$/../../SchemSearch.java" afterDir="false" />
</list>
<option name="SHOW_DIALOG" value="false" />
<option name="HIGHLIGHT_CONFLICTS" value="true" />
<option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
<option name="LAST_RESOLUTION" value="IGNORE" />
</component>
<component name="ClangdSettings">
<option name="formatViaClangd" value="false" />
</component>
<component name="Git.Settings">
<option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$/../.." />
</component>
<component name="ProjectColorInfo"><![CDATA[{
"customColor": "",
"associatedIndex": 8
}]]></component>
<component name="ProjectId" id="2gFqSldpa6G5CPOKD9Sjp2GUcRW" />
<component name="ProjectViewState">
<option name="hideEmptyMiddlePackages" value="true" />
<option name="showLibraryContents" value="true" />
</component>
<component name="PropertiesComponent"><![CDATA[{
"keyToString": {
"RunOnceActivity.ShowReadmeOnStart": "true",
"RunOnceActivity.cidr.known.project.marker": "true",
"RunOnceActivity.readMode.enableVisualFormatting": "true",
"cf.first.check.clang-format": "false",
"cidr.known.project.marker": "true",
"git-widget-placeholder": "master",
"nodejs_package_manager_path": "npm",
"vue.rearranger.settings.migration": "true"
}
}]]></component>
<component name="SpellCheckerSettings" RuntimeDictionaries="0" Folders="0" CustomDictionaries="0" DefaultDictionary="application-level" UseSingleDictionary="true" transferred="true" />
<component name="TaskManager">
<task active="true" id="Default" summary="Default task">
<changelist id="352451bc-b368-403e-b1be-bfdcb573471f" name="Changes" comment="" />
<created>1715303674752</created>
<option name="number" value="Default" />
<option name="presentableId" value="Default" />
<updated>1715303674752</updated>
<workItem from="1715303675811" duration="8000" />
</task>
<servers />
</component>
<component name="TypeScriptGeneratedFilesManager">
<option name="version" value="3" />
</component>
</project>

View File

@ -1,16 +1,19 @@
use crate::pattern_mapper::{match_palette, match_palette_adapt};
use math::round::ceil; use math::round::ceil;
use schemsearch_common::Match; use schemsearch_common::time;
use schemsearch_common::{Match, SearchBehavior};
use schemsearch_files::SpongeSchematic; use schemsearch_files::SpongeSchematic;
use schemsearch_ocl_matcher::ocl_search; use schemsearch_ocl_matcher::ocl_search;
use crate::{SearchBehavior};
use crate::pattern_mapper::{match_palette, match_palette_adapt};
pub fn search( pub fn search(
schem: SpongeSchematic, schem: SpongeSchematic,
pattern_schem: &SpongeSchematic, pattern_schem: &SpongeSchematic,
search_behavior: SearchBehavior, search_behavior: SearchBehavior,
) -> Vec<Match> { ) -> Vec<Match> {
if schem.width < pattern_schem.width || schem.height < pattern_schem.height || schem.length < pattern_schem.length { if schem.width < pattern_schem.width
|| schem.height < pattern_schem.height
|| schem.length < pattern_schem.length
{
return Vec::new(); return Vec::new();
} }
@ -18,17 +21,27 @@ pub fn search(
return Vec::new(); return Vec::new();
} }
let pattern_schem = match_palette(&schem, &pattern_schem, search_behavior.ignore_block_data); let pattern_schem = time!(match_palette, {
match_palette(&schem, &pattern_schem, search_behavior.ignore_block_data)
});
let mut matches: Vec<Match> = Vec::with_capacity(4); let mut matches: Vec<Match> = Vec::with_capacity(4);
let schem_data = if search_behavior.ignore_block_data { let schem_data = if search_behavior.ignore_block_data {
match_palette_adapt(&schem, &pattern_schem.palette, search_behavior.ignore_block_data) match_palette_adapt(
&schem,
&pattern_schem.palette,
search_behavior.ignore_block_data,
)
} else { } else {
schem.block_data schem.block_data
}; };
let air_id = if search_behavior.ignore_air || search_behavior.air_as_any { pattern_schem.palette.get("minecraft:air").unwrap_or(&-1) } else { &-1}; let air_id = if search_behavior.ignore_air || search_behavior.air_as_any {
pattern_schem.palette.get("minecraft:air").unwrap_or(&-1)
} else {
&-1
};
let pattern_blocks = pattern_schem.block_data.len() as f32; let pattern_blocks = pattern_schem.block_data.len() as f32;
let i_pattern_blocks = pattern_blocks as i32; let i_pattern_blocks = pattern_blocks as i32;
@ -42,29 +55,42 @@ pub fn search(
let schem_length = schem.length as usize; let schem_length = schem.length as usize;
if search_behavior.opencl { if search_behavior.opencl {
return ocl_search(schem_data.as_slice(), [schem_width, schem_height, schem_length], pattern_schem.block_data.as_slice(), [pattern_width, pattern_height, pattern_length], *air_id, search_behavior).unwrap() return time!(ocl_search, {
ocl_search(
schem_data.as_slice(),
[schem_width, schem_height, schem_length],
pattern_schem.block_data.as_slice(),
[pattern_width, pattern_height, pattern_length],
*air_id,
search_behavior,
)
.unwrap()
});
} }
let schem_data = schem_data.as_ptr(); let schem_data = schem_data.as_ptr();
let pattern_data = pattern_schem.block_data.as_ptr(); let pattern_data = pattern_schem.block_data.as_ptr();
let skip_amount = ceil((pattern_blocks * (1.0 - search_behavior.threshold)) as f64, 0) as i32; let skip_amount = ceil(
(pattern_blocks * (1.0 - search_behavior.threshold)) as f64,
0,
) as i32;
for y in 0..=schem_height - pattern_height { for y in 0..=schem_height - pattern_height {
for z in 0..=schem_length - pattern_length { for z in 0..=schem_length - pattern_length {
for x in 0..=schem_width - pattern_width { for x in 0..=schem_width - pattern_width {
let mut not_matching = 0; let mut not_matching = 0;
'outer: 'outer: for j in 0..pattern_height {
for j in 0..pattern_height {
for k in 0..pattern_length { for k in 0..pattern_length {
'inner: 'inner: for i in 0..pattern_width {
for i in 0..pattern_width {
let index = (x + i) + schem_width * ((z + k) + (y + j) * schem_length); let index = (x + i) + schem_width * ((z + k) + (y + j) * schem_length);
let pattern_index = i + pattern_width * (k + j * pattern_length); let pattern_index = i + pattern_width * (k + j * pattern_length);
let data = unsafe { *schem_data.add(index) }; let data = unsafe { *schem_data.add(index) };
let pattern_data = unsafe { *pattern_data.add(pattern_index) }; let pattern_data = unsafe { *pattern_data.add(pattern_index) };
if (search_behavior.ignore_air && data != *air_id) || (search_behavior.air_as_any && pattern_data != *air_id) { if (search_behavior.ignore_air && data != *air_id)
|| (search_behavior.air_as_any && pattern_data != *air_id)
{
continue 'inner; continue 'inner;
} }
if data != pattern_data { if data != pattern_data {

View File

@ -1,47 +1,31 @@
__kernel void add(__global int* result, // Use 3d_img
__global uint* schem, // Weniger Allocs an Buffern
__global uint* pattern, // Pattern Parallelisieren mit Local Workern?
const int p_width, // To Match on GPU
const int p_height, // Weniger Worker, Mehr Parameter!
const int p_depth, // Pattern als Kernel Konstante
const uint air_id,
const int ignore_air, __kernel void add(__global int *result, __global uint *schem,
const int air_as_any, __constant uint *pattern, const int width, const int height,
const int skipamount) { const int depth, const int p_width, const int p_height,
const int p_depth, const uint air_id, const int ignore_air,
const int air_as_any, const int skipamount) {
int x = get_global_id(0); int x = get_global_id(0);
int y = get_global_id(1); int y = get_global_id(2);
int z = get_global_id(2); int z = get_global_id(1);
int width = get_global_size(0);
int height = get_global_size(1);
int depth = get_global_size(2);
if (x > width - p_width || y > height - p_height || z > depth - p_depth) {
return;
}
int wrong_blocks = 0; int wrong_blocks = 0;
for (int py = 0; py < p_height; py++) { for (int py = 0; py < p_height; py++) {
for (int pz = 0; pz < p_depth; pz++) { for (int pz = 0; pz < p_depth; pz++) {
for (int px = 0; px < p_width; px++) { for (int px = 0; px < p_width; px++) {
int s_idx = (x + px) + width * ((z + pz) + (y + py) * depth); // if ((ignore_air && schem_block != air_id) || (air_as_any &&
int p_idx = px + p_width * (pz + py * p_depth); // pattern_block != air_id)) {
// continue; // TODO: PROBLEM!
// }
uint schem_block = schem[s_idx]; wrong_blocks +=
uint pattern_block = pattern[p_idx]; schem[(x + px) + width * ((z + pz) + (y + py) * depth)] !=
pattern[px + p_width * (pz + py * p_depth)];
if ((ignore_air && schem_block != air_id) || (air_as_any && pattern_block != air_id)) {
continue;
}
if (schem_block != pattern_block) {
wrong_blocks++;
if (wrong_blocks > skipamount) {
int idx = x + z * width + y * width * depth;
result[idx] = wrong_blocks;
return;
}
}
} }
} }
} }

View File

@ -1,8 +1,9 @@
use std::sync::OnceLock;
use ocl::{Buffer, MemFlags, ProQue, core};
use ocl::SpatialDims::Three;
use schemsearch_common::{Match, SearchBehavior};
use math::round::ceil; use math::round::ceil;
use ocl::SpatialDims::Three;
use ocl::{core, Buffer, Image, MemFlags, ProQue};
use schemsearch_common::{time, Match, SearchBehavior};
use std::sync::OnceLock;
use std::time;
const KERNEL: &str = include_str!("kernel.cl"); const KERNEL: &str = include_str!("kernel.cl");
@ -20,7 +21,15 @@ pub fn ocl_search(
air_id: i32, air_id: i32,
search_behavior: SearchBehavior, search_behavior: SearchBehavior,
) -> Result<Vec<Match>, String> { ) -> Result<Vec<Match>, String> {
search_ocl(schem, schem_size, pattern, pattern_size, air_id, search_behavior).map_err(|e| e.to_string()) search_ocl(
schem,
schem_size,
pattern,
pattern_size,
air_id,
search_behavior,
)
.map_err(|e| e.to_string())
} }
fn search_ocl( fn search_ocl(
@ -41,56 +50,76 @@ fn search_ocl(
let pattern_blocks = (pattern_width * pattern_height * pattern_length) as f32; let pattern_blocks = (pattern_width * pattern_height * pattern_length) as f32;
let skip_amount = ceil((pattern_blocks * (1.0 - search_behavior.threshold)) as f64, 0) as i32; let skip_amount = ceil(
(pattern_blocks * (1.0 - search_behavior.threshold)) as f64,
0,
) as i32;
let cell = &PRO_QUEU_CELL; let cell = &PRO_QUEU_CELL;
let mut pro_que = cell.get_or_init(|| { let mut pro_que = time!(get_pro_que, {
ProQue::builder() cell.get_or_init(|| ProQue::builder().src(KERNEL).build().unwrap())
.src(KERNEL) .clone()
.build().unwrap() });
}).clone();
pro_que.set_dims(Three(schem_width, schem_length, schem_height));
pro_que.set_dims(Three(schem_width, schem_height, schem_length)); let buffer = time!(create_result_buffer, {
Buffer::builder()
let buffer = Buffer::builder()
.queue(pro_que.queue().clone()) .queue(pro_que.queue().clone())
.flags(MemFlags::new().read_write()) .flags(MemFlags::new().read_write())
.fill_val(-1) .fill_val(-1)
.len(schem.len()) .len(schem.len())
.build()?; .build()
})?;
let schem_buffer = create_schem_buffer(schem, &pro_que)?; let schem_buffer = time!(create_schen_buffer, {
create_schem_buffer(schem, &pro_que)
})?;
let pattern_buffer = create_schem_buffer(pattern, &pro_que)?; let pattern_buffer = time!(create_pattern_buffer, {
create_schem_buffer(pattern, &pro_que)
})?;
let kernel = pro_que.kernel_builder("add") let kernel = time!(create_kernel, {
pro_que
.kernel_builder("add")
.arg(&buffer) .arg(&buffer)
.arg(&schem_buffer) .arg(&schem_buffer)
.arg(&pattern_buffer) .arg(&pattern_buffer)
.arg(schem_width as i32)
.arg(schem_height as i32)
.arg(schem_length as i32)
.arg(pattern_width as i32) .arg(pattern_width as i32)
.arg(pattern_height as i32) .arg(pattern_height as i32)
.arg(pattern_length as i32) .arg(pattern_length as i32)
.arg(air_id) // air_id .arg(air_id)
.arg(search_behavior.ignore_air as u32) // ignore_air .arg(search_behavior.ignore_air as u32)
.arg(search_behavior.air_as_any as u32) // air_as_any .arg(search_behavior.air_as_any as u32)
.arg(skip_amount) .arg(skip_amount)
.build()?; .build()
})?;
unsafe { kernel.enq()?; } unsafe {
time!(run_kernel, { kernel.enq() })?;
}
let mut vec = vec![0i32; buffer.len()]; let mut vec = vec![0; buffer.len()];
time!(read_buffer, {
buffer.read(&mut vec).enq()?; buffer.read(&mut vec).enq()?;
});
Ok(vec.into_iter().enumerate().filter(|(_, v)| *v < skip_amount && *v != -1).map(|(i, v)| { Ok(vec
Match { .into_iter()
.enumerate()
.filter(|(_, v)| *v < skip_amount && *v != -1)
.map(|(i, v)| Match {
x: (i % schem_width) as u16, x: (i % schem_width) as u16,
y: ((i / (schem_width * schem_length)) % schem_height) as u16, y: ((i / (schem_width * schem_length)) % schem_height) as u16,
z: ((i / schem_width) % schem_length) as u16, z: ((i / schem_width) % schem_length) as u16,
percent: (pattern_blocks - v as f32) / pattern_blocks, percent: (pattern_blocks - v as f32) / pattern_blocks,
} })
}).collect()) .collect())
} }
fn create_schem_buffer(pattern: &[i32], pro_que: &ProQue) -> ocl::Result<Buffer<i32>> { fn create_schem_buffer(pattern: &[i32], pro_que: &ProQue) -> ocl::Result<Buffer<i32>> {
@ -98,6 +127,7 @@ fn create_schem_buffer(pattern: &[i32], pro_que: &ProQue) -> ocl::Result<Buffer<
.queue(pro_que.queue().clone()) .queue(pro_que.queue().clone())
.flags(MemFlags::new().read_only()) .flags(MemFlags::new().read_only())
.len(pattern.len()) .len(pattern.len())
// Host Memory Map?
.copy_host_slice(pattern) .copy_host_slice(pattern)
.build() .build()
} }