]> OzVa Git service - rust_fft/commitdiff
Color correction and C++ changes
authorMax Value <greenwoodw50@gmail.com>
Sun, 11 Jan 2026 23:57:18 +0000 (23:57 +0000)
committerMax Value <greenwoodw50@gmail.com>
Sun, 11 Jan 2026 23:57:18 +0000 (23:57 +0000)
+ windows support for camera capture (switched rscam for nokhwa)
+ windows support for paths
+ show_image GPU flag in build
+ more todo notes
~ split the major structs into their own files
+ the example sound (Souled American - Second of All)

NEW:
+ C++ color correction and integrated into the main script
(not currently working)
+ improvements to the lut generator

18 files changed:
Cargo.toml
build.rs
check.py [new file with mode: 0644]
src/barrel.cpp [new file with mode: 0644]
src/color.cpp [new file with mode: 0644]
src/generate_distort.py
src/generate_lut.py
src/homography.cpp [new file with mode: 0644]
src/image_array.rs [new file with mode: 0644]
src/lut/camera.py
src/lut/config.py
src/lut/frame.py
src/main.rs
src/perspective.cpp [deleted file]
src/process.cpp [new file with mode: 0644]
src/sample_buffer.rs [new file with mode: 0644]
test/example.wav [new file with mode: 0644]
todo

index c7bbe3bfadde875ae6398e44e435dfa379fb41a5..aa48132892bcb2a0cf9b8bf4c0c0509ca56b7156 100644 (file)
@@ -15,6 +15,8 @@ cpal = "0.15.3"
 rscam = "0.5.5"
 npyz = "0.8.4"
 rand = "0.9.2"
+nokhwa = {version = "0.10.10", features = ["input-native"]}
+relative-path = "2.0.1"
 
 [build-dependencies]
 cc = "1.0"
index b65310586f7fe728be8455e66163c7f7033c9c4b..016c4c91d06e6bd91a150f1f1a2c4c40621a6da0 100644 (file)
--- a/build.rs
+++ b/build.rs
@@ -1,14 +1,25 @@
 fn main() {
-       println!("cargo::rerun-if-changed=src/perspective.cpp");
+       println!("cargo::rerun-if-changed=src/process.cpp");
+       println!("cargo::rerun-if-changed=src/homography.cpp");
+       println!("cargo::rerun-if-changed=src/color.cpp");
        println!("cargo::rustc-env=CXXFLAGS=-Wunused-parameter -lopencv_core -lopencv_highgui -lopencv_xfeatures2d -lopencv_calib3d -lopencv_videoio -lopencv_imgcodecs -lopencv_imgproc -lopencv_features2d");
 
        cc::Build::new()
-               .file("src/perspective.cpp")
+               .file("src/process.cpp")
                .cpp(true)
                .include("/usr/include/opencv4/")
-               .compile("perspective.a");
+
+               // definitions shared across languages
+               .define("WINDOW_SIZE", "128")
+               .define("CHUNK_SIZE", "72")
+               .define("IMAGE_WIDTH", "1920")
+               .define("IMAGE_HEIGHT", "1080")
+               .define("LUT_SIZE", "12")
+
+               .compile("process.a");
 
        println!("cargo::rustc-flags=-lopencv_core -lopencv_highgui -lopencv_xfeatures2d -lopencv_calib3d -lopencv_videoio -lopencv_imgcodecs -lopencv_imgproc -lopencv_features2d");
 
-       println!("cargo:rustc-env=WGPU_BACKEND=gl") // fix show_image bug(?)
+       println!("cargo:rustc-env=WGPU_BACKEND=gl"); // fix show_image bug(?)
+       println!("cargo:rustc-env=WGPU_POWER_PREF=high"); // can switch to low if performance issues
 }
diff --git a/check.py b/check.py
new file mode 100644 (file)
index 0000000..b6512bd
--- /dev/null
+++ b/check.py
@@ -0,0 +1,25 @@
+import numpy as np
+
+SCALER = (12 - 1) / 255;
+
+def run_color(color, a):
+
+       # at the moment this is how the C++ works too;
+       # I think there might actually be something up with the LUT itself
+
+       color = color.astype(np.float64) * SCALER
+
+       floor = np.floor(color).astype(np.uint8)
+       ceil = np.ceil(color).astype(np.uint8)
+       rem = np.remainder(color, 1)
+
+       new_color = a[*floor] + ((a[*ceil] - a[*floor]) * rem)
+       new_color = np.round(new_color).astype(np.uint8)
+
+       print(new_color)
+       quit()
+
+if __name__ == "__main__":
+       a = np.load("./data/cube.npy")
+
+       print(run_color(np.array([79,2,91]), a))
diff --git a/src/barrel.cpp b/src/barrel.cpp
new file mode 100644 (file)
index 0000000..f2af095
--- /dev/null
@@ -0,0 +1,26 @@
+#include "opencv4/opencv2/imgproc.hpp"
+
+using namespace cv;
+
+void ApplyUndistort(uint8_t *camera_ptr, float *xmat_ptr, float *ymat_ptr)
+{
+       Mat xmat (IMAGE_HEIGHT, IMAGE_WIDTH, CV_32F, xmat_ptr);
+       Mat ymat (IMAGE_HEIGHT, IMAGE_WIDTH, CV_32F, ymat_ptr);
+
+       Mat capture(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
+       Mat buffer = capture.clone();
+
+       /* This won't work because the Mats have to be GpuMats. Since we're getting a
+        * pointer for them, it might be better to move it all over onto the GPU and
+        * then do the warp transform all at the same time.
+        *
+        * This might be a bit messy.
+        *
+        * Also, if I'm writing CUDA code in C++ and then moving between Rust and C++,
+        * it might just be easier to implement a lot of the color stuff in Rust. The
+        * question is whether it is more efficient to just do it on the CPU, or to
+        * move it over to the GPU and do it there...
+        */
+
+       remap(buffer, capture, xmat, ymat, INTER_NEAREST);
+}
diff --git a/src/color.cpp b/src/color.cpp
new file mode 100644 (file)
index 0000000..82ad0ec
--- /dev/null
@@ -0,0 +1,83 @@
+#include <cmath>
+#include "opencv4/opencv2/core.hpp"
+#include "opencv4/opencv2/highgui.hpp"
+#include "opencv4/opencv2/xfeatures2d.hpp"
+#include "opencv4/opencv2/calib3d.hpp"
+#include "opencv4/opencv2/imgproc.hpp"
+
+#ifndef LUT_SIZE
+const int LUT_SIZE = 12;
+#endif
+
+using namespace std;
+using namespace cv;
+
+// is this damn well right?!?!
+const float SCALER = ((float)LUT_SIZE - 1.) / 255.;
+
+void ApplyCorrection(uint8_t *buffer_ptr, uint8_t *lut_ptr)
+{
+       try
+       {
+               Mat capture(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, buffer_ptr);
+
+               MatIterator_<Point3_<uint8_t>> it = capture.begin<Point3_<uint8_t>>();
+               MatIterator_<Point3_<uint8_t>> it_end = capture.end<Point3_<uint8_t>>();
+
+               /*
+                * Pretty sure that because we're not actually using OpenCV for anything
+                * here, other than some iterator stuff that might actually add a lot
+                * of overhead, we don't actually need to have the pixels read in BGR
+                * format.
+                */
+
+               for (; it != it_end; it++) {
+                       Point3_<uint8_t> pixel = (*it);
+
+                       Point3_<float> scaled (pixel);
+                       scaled *= SCALER;
+
+                       int r = floor(scaled.z);
+                       int g = floor(scaled.y);
+                       int b = floor(scaled.x);
+
+                       int idx = (((LUT_SIZE * LUT_SIZE) * r) + (LUT_SIZE * g)+ b) * 3;
+
+                       uint8_t r_1 = *(lut_ptr + idx + 0);
+                       uint8_t g_1 = *(lut_ptr + idx + 1);
+                       uint8_t b_1 = *(lut_ptr + idx + 2);
+
+                       int offset = 0;
+                       if (r < 253) {
+                               offset += LUT_SIZE * LUT_SIZE * 3;
+                       }
+                       if (g < 253) {
+                               offset += LUT_SIZE * 3;
+                       }
+                       if (b < 253) {
+                               offset += 3;
+                       }
+
+                       uint8_t r_2 = *(lut_ptr + idx + offset + 0);
+                       uint8_t g_2 = *(lut_ptr + idx + offset + 1);
+                       uint8_t b_2 = *(lut_ptr + idx + offset + 2);
+
+                       double n;
+                       // pretty sure we can avoid this with null pointers, but it
+                       // didn't work when I tried just now
+
+                       double r_w = modf(scaled.z, &n);
+                       double g_w = modf(scaled.y, &n);
+                       double b_w = modf(scaled.x, &n);
+
+                       (*it).z = r_1 + (double)((r_2 - r_1) * r_w);
+                       (*it).y = g_1 + (double)((g_2 - g_1) * g_w);
+                       (*it).x = b_1 + (double)((b_2 - b_1) * b_w);
+               }
+       }
+       catch (const std::exception &e) // handle exceptions for rust
+       {
+               std::cout << "Exception " << e.what() << std::endl;
+       }
+}
+
index 208db87cda7d2631bcab18d0065dbd72c72c47ae..696e84306c2e61f64539629a2f6b661b51143a4a 100644 (file)
@@ -47,8 +47,8 @@ newcameramtx, roi = cv.getOptimalNewCameraMatrix(mtx, dist, (w,h), 1, (w,h))
 mapx, mapy = cv.initUndistortRectifyMap(mtx, dist, None, newcameramtx, (w,h), 5)
 dst = cv.remap(img, mapx, mapy, cv.INTER_LINEAR)
 
-full_map = np.stack((mapx, mapy))
-np.save("./data/map.npy", full_map)
+np.save("./data/mapx.npy", mapx)
+np.save("./data/mapy.npy", mapy)
 
 # crop the image
 x, y, w, h = roi
index 4b54ebe08540f633ecf040d6595776778efac73b..d4db011a9462227c0691794dc652eba485554b47 100755 (executable)
@@ -2,6 +2,7 @@ from lut.camera import Camera
 from lut.graph import show
 from lut.test import validate
 from lut.cube import Cube
+from lut.config import PASSTHROUGH, CAST_TEST
 
 from numpy import save
 import matplotlib.pyplot as plt
@@ -21,8 +22,10 @@ if __name__ == "__main__":
        show(lut.lut)
 
        # validate error of LUT
-       validate(lut)
 
-       save("../data/cube.npy", lut.lut)
+       if PASSTHROUGH and CAST_TEST:
+               validate(lut)
+
+       save("./data/cube.npy", lut.lut)
 
 
diff --git a/src/homography.cpp b/src/homography.cpp
new file mode 100644 (file)
index 0000000..c68c21b
--- /dev/null
@@ -0,0 +1,75 @@
+#include "opencv4/opencv2/xfeatures2d.hpp"
+#include "opencv4/opencv2/calib3d.hpp"
+#include "opencv4/opencv2/imgproc.hpp"
+#include "opencv4/opencv2/imgcodecs.hpp"
+
+using namespace cv;
+using namespace cv::xfeatures2d;
+
+void FuncGetHomography(uint8_t *camera_ptr, double *homography_ptr)
+{
+       try
+       {
+               Mat img1 = imread( samples::findFile("./test/calibration.jpg")/*, IMREAD_GRAYSCALE */);
+               Mat img2(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
+
+               // detect keypoints and compute descriptors
+               int minHessian = 400;
+               Ptr<SURF> detector = SURF::create( minHessian );
+
+               std::vector<KeyPoint> keypoints1, keypoints2;
+               Mat descriptors1, descriptors2;
+               detector->detectAndCompute( img1, noArray(), keypoints1, descriptors1 );
+               detector->detectAndCompute( img2, noArray(), keypoints2, descriptors2 );
+
+               // match descriptors
+               Ptr<DescriptorMatcher> matcher = DescriptorMatcher::create(DescriptorMatcher::FLANNBASED);
+               std::vector< std::vector<DMatch> > knn_matches;
+
+               matcher->knnMatch( descriptors1, descriptors2, knn_matches, 2 );
+
+               // filter matches by the ratio test
+               const float ratio_thresh = 0.7f;
+               std::vector<DMatch> good_matches;
+               for (size_t i = 0; i < knn_matches.size(); i++)
+               {
+                       if (knn_matches[i][0].distance < ratio_thresh * knn_matches[i][1].distance)
+                       {
+                               good_matches.push_back(knn_matches[i][0]);
+                       }
+               }
+
+               // get the source and destination points
+               std::vector<Point2f> source_points, dst_points;
+               for (size_t i = 0; i < good_matches.size(); i++)
+               {
+                       Point2f s_point = keypoints2[good_matches[i].trainIdx].pt;
+                       Point2f d_point = keypoints1[good_matches[i].queryIdx].pt;
+                       source_points.push_back(s_point);
+                       dst_points.push_back(d_point);
+               }
+
+               // perform homography
+               double ransac_thresh = 5.0f;
+               Mat homography = findHomography(source_points, dst_points, RANSAC, ransac_thresh);
+
+               // copy the result to the homography location
+               const double* result_ptr = homography.ptr<double>(0);
+               std::memcpy(homography_ptr, result_ptr, 72); // size of [f64; 9]
+       }
+       catch (const std::exception &e) // handle exceptions for rust
+       {
+               std::cout << "Exception " << e.what() << std::endl;
+       }
+}
+
+void ApplyHomography(uint8_t *camera_ptr, uint8_t *buffer_ptr, double *homography_ptr)
+{
+       Mat capture(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
+       Mat buffer(CHUNK_SIZE, WINDOW_SIZE, CV_8UC3, buffer_ptr);
+       Mat homography(3, 3, CV_64F, homography_ptr);
+
+       warpPerspective(capture, capture, homography, capture.size());
+       resize(capture, buffer, buffer.size());
+}
+
diff --git a/src/image_array.rs b/src/image_array.rs
new file mode 100644 (file)
index 0000000..ae23ca3
--- /dev/null
@@ -0,0 +1,179 @@
+use nokhwa::Camera;
+use nokhwa::utils::{RequestedFormat, CameraIndex};
+use nokhwa::pixel_format::RgbFormat;
+
+use rustfft::num_complex::Complex;
+
+use npyz::NpyFile;
+
+use std::io::BufReader;
+use std::fs::File;
+
+use crate::{
+       GetHomography,
+       ProcessCapture,
+       LUT_LENGTH,
+       SPECTOGRAM_AREA,
+       IMAGE_AREA,
+       VOLUME_MIN,
+       VOLUME_REL,
+       AMPLITUDE_REL,
+       AMPLITUDE_MIN,
+       ANGLE_REL,
+       ANGLE_MIN
+};
+
+pub struct ImageArray {
+       pub data: Vec<u8>,
+       homography: [f64; 9],
+       lut: [u8; LUT_LENGTH],
+       camera_buffer: Vec<u8>,
+       camera: Camera,
+       chunks: usize
+}
+
+impl ImageArray {
+       pub fn new (homography: [f64; 9]) -> Self {
+
+               // digest the numpy array and setup lut
+               let file = BufReader::new(File::open("./data/cube.npy").unwrap());
+               let npy = NpyFile::new(file).unwrap();
+
+               // this is a little silly; I should handle these errors properly
+               let lut: [u8; LUT_LENGTH] = npy.into_vec().unwrap().try_into().unwrap();
+
+               // setup the camera
+               let index = CameraIndex::Index(0);
+               let requested = RequestedFormat::new::<RgbFormat>(
+                       nokhwa::utils::RequestedFormatType::AbsoluteHighestFrameRate
+               );
+
+               let mut camera = Camera::new(index, requested).unwrap();
+
+               camera.set_resolution(
+                       nokhwa::utils::Resolution { width_x: 1920, height_y: 1080}
+               ).expect("Resolution problem!");
+
+               // self
+               Self {
+                       data: vec![0u8; SPECTOGRAM_AREA * 3],
+                       homography,
+                       lut,
+                       camera_buffer: vec![0u8; IMAGE_AREA],
+                       camera,
+                       chunks: SPECTOGRAM_AREA
+               }
+       }
+
+       pub fn from_camera (&mut self) {
+               let frame = self.camera.frame().unwrap();
+
+               println!("{}", frame.resolution());
+
+               self.camera_buffer = frame.buffer()[..].try_into().expect("Image is wrong size");
+
+               unsafe {
+                       ProcessCapture (
+                               self.camera_buffer.as_ptr() as usize,
+                                                       self.data.as_ptr() as usize,
+                                                       self.homography.as_ptr() as usize,
+                                                       self.lut.as_ptr() as usize
+                       );
+               }
+       }
+
+       pub fn calibrate (&mut self) {
+               // hopefully we don't need this!
+               // for _i in 0..10 {
+               //      self.camera_buffer = self.camera.capture().unwrap()[..].try_into().expect("Image is wrong size"); //delete assignment
+               // }
+
+               // enter unsafe and get the homography array
+               unsafe {
+                       GetHomography(self.camera_buffer.as_ptr() as usize, self.homography.as_ptr() as usize);
+               }
+       }
+
+       pub fn from_buffer (&mut self, buffer: &Vec<Complex<f32>>) -> () {
+               let mut r: f32;
+               let mut theta: f32;
+               let mut amplitude: f32;
+
+               let mut hue: f32;
+               let mut angle: f32;
+
+               let mut d:f32;
+               let mut s:f32;
+               let mut v:f32;
+               let mut c:f32;
+               let mut m:f32;
+               let mut x:f32;
+               let mut g:f32;
+               let mut b:f32;
+
+               for i in 0..self.chunks {
+                       (r, theta) = buffer[i].to_polar();
+
+                       // make linear and normalize
+                       amplitude = 20f32 * r.log10();
+                       amplitude = ((amplitude - VOLUME_MIN) / (VOLUME_REL / AMPLITUDE_REL)) + AMPLITUDE_MIN;
+
+                       hue = (180f32 / 255f32) * amplitude;
+
+                       angle = (theta.to_degrees() + 180f32) * (ANGLE_REL / 360f32) + ANGLE_MIN;
+
+                       d = hue * (1f32 / 30f32);
+                       s = angle / 255f32;
+                       v = amplitude / 255f32;
+
+                       c = s * v;
+                       m = v - c;
+                       x = c * (1f32 - (d.rem_euclid(2f32) - 1f32).abs());
+
+                       (r, g, b) = match d.floor() {
+                               0.0 => (c, x, 0f32),
+                               1.0 => (x, c, 0f32),
+                               2.0 => (0f32, c, x),
+                               3.0 => (0f32, x, c),
+                               4.0 => (x, 0f32, c),
+                               _ => (c, 0f32, x)
+                       };
+
+                       self.data[i*3] = ((r + m) * 255f32) as u8;
+                       self.data[i*3+1] = ((g + m) * 255f32) as u8;
+                       self.data[i*3+2] = ((b + m) * 255f32) as u8;
+               }
+       }
+
+       pub fn to_buffer (&mut self, buffer: &mut Vec<Complex<f32>>) -> () {
+               let mut r: f32;
+               let mut amplitude: f32;
+
+               let mut angle: f32;
+
+               let mut s:f32;
+               let mut v:f32;
+               let mut c:f32;
+               let mut g:f32;
+               let mut b:f32;
+
+               for i in 0..self.chunks {
+                       r = self.data[i*3] as f32;
+                       g = self.data[i*3+1] as f32;
+                       b = self.data[i*3+2] as f32;
+
+                       v = r.max(g).max(b);
+                       c = (v - r.min(g).min(b)) * 255f32;
+                       s = if v == 0f32 { 0f32 } else { c / v };
+
+                       amplitude = (v - AMPLITUDE_MIN) * (VOLUME_REL / AMPLITUDE_REL) + VOLUME_MIN;
+
+                       amplitude = 10f32.powf(amplitude / 20f32);
+
+                       angle = (s - ANGLE_MIN) / (ANGLE_REL / 360f32) - 180f32;
+                       angle = angle.to_radians();
+
+                       buffer[i] = Complex::from_polar(amplitude, angle);
+               }
+       }
+}
index 00e96e3ad14b17f6854bea0d5c20c0d00b2a6e43..691d8da7246c3d2d92af5f9507d349e5a763c826 100644 (file)
@@ -1,4 +1,4 @@
-from .config import IMAGE_WIDTH, IMAGE_HEIGHT, CAP_WAIT
+from .config import IMAGE_WIDTH, IMAGE_HEIGHT, CAP_WAIT, PASSTHROUGH
 
 import numpy as np
 import cv2 as cv
@@ -11,7 +11,7 @@ class Camera():
                self.camera = cv.VideoCapture(device)
                self.homography = None
 
-               #self.calibrate()
+               if not PASSTHROUGH: self.calibrate()
 
        # get image from camera and fix perspective
        def get(self, image):
@@ -19,8 +19,10 @@ class Camera():
                cv.imshow("LUT Calibration", small)
                cv.waitKey(CAP_WAIT)
 
-               #_, capture = self.camera.read()
-               capture = image
+               if PASSTHROUGH:
+                       return image
+
+               _, capture = self.camera.read()
 
                if self.homography is not None:
                        capture = cv.warpPerspective(
@@ -29,7 +31,6 @@ class Camera():
                                (IMAGE_WIDTH, IMAGE_HEIGHT)
                                )
 
-               return image
                return capture
 
        # standard calibration function
index 980b56231adc836c06b88606537577fa144833d9..0239b42f9282bebf22dc42376733ac9b48fed12d 100644 (file)
@@ -20,3 +20,7 @@ WAIT_TICKS = 100 #s
 
 # how long to wait before capturing image (1 minimum)
 CAP_WAIT = 1
+
+# whether to use the camera or not
+PASSTHROUGH = True
+CAST_TEST = False
index 83ab87f7616366af8d1fc08bbe281cc2e108fb84..d20e27a4dc71686f69e774f3549951a960abe40a 100644 (file)
@@ -1,4 +1,4 @@
-from .config import QR_SIZE, QR_PADDING, IMAGE_WIDTH, IMAGE_HEIGHT
+from .config import QR_SIZE, QR_PADDING, IMAGE_WIDTH, IMAGE_HEIGHT, CAST_TEST
 
 from pyzbar.pyzbar import decode
 import numpy as np
@@ -34,7 +34,8 @@ def generate(color):
        qr_image = np.repeat(qr_image[:, :, np.newaxis], 3, axis=2)
        qr_image = cv.resize(qr_image, (QR_SIZE,QR_SIZE), interpolation=cv.INTER_NEAREST)
 
-       color = cast(color)
+       if CAST_TEST:
+               color = cast(color)
 
        # create color image of correct shape
        c_image = np.array([[color[::-1]]], dtype=np.uint8)
index 504b6e6ab45646d9234c544dbda099667694a146..d005d8f9c23165d5d6a532f17f44c81cd5d1ba53 100644 (file)
@@ -7,14 +7,14 @@ use cpal::{StreamConfig, BufferSize, SampleRate};
 use cpal::traits::{DeviceTrait, HostTrait, StreamTrait};
 use std::sync::{Arc, Mutex};
 use std::sync::mpsc;
-use std::sync::mpsc::Sender;
-use rscam::{Camera, Config};
 use image::ImageReader;
+use relative_path::RelativePath;
 
-mod correct;
+mod image_array;
+mod sample_buffer;
 
-use crate::correct::Correcter;
-use crate::correct::_cast;
+use image_array::ImageArray;
+use sample_buffer::SampleBuffer;
 
 const WINDOW_SIZE: usize = 128;
 const CHUNK_SIZE: usize = 72;
@@ -24,7 +24,7 @@ const SPECTOGRAM_AREA: usize = WINDOW_SIZE * CHUNK_SIZE;
 const IMAGE_WIDTH: usize = 1920;
 const IMAGE_HEIGHT: usize = 1080;
 const IMAGE_AREA: usize = IMAGE_WIDTH * IMAGE_HEIGHT * 3;
-const FPS: usize = 30;
+// const FPS: usize = 30;
 
 // maximum and minimum pixel values of angle and amplitude. could be confined to
 // improve performance for quiet sounds.
@@ -43,192 +43,17 @@ const VOLUME_MAX: f32 = 65.0; // 60 - 65
 const VOLUME_MIN: f32 = -40.0;
 const VOLUME_REL: f32 = VOLUME_MAX - VOLUME_MIN;
 
+const LUT_SIZE: usize = 12;
+const LUT_LENGTH: usize = LUT_SIZE * LUT_SIZE * LUT_SIZE * 3;
+
 const DEBUG_MODE: bool = true;
 
+const CALIBRATION_PATH: &str = "./test/calibration.jpg";
+const AUDIO_PATH: &str = "/home/will/Downloads/Adducci - Around the Horn.wav";
+
 extern "C" {
   fn GetHomography(camera_ptr: usize, homography_ptr: usize);
-  fn ApplyHomography(camera_ptr: usize, buffer_ptr: usize, homography_ptr: usize);
-}
-
-struct ImageArray {
-       data: Vec<u8>,
-       homography: [f64; 9],
-       corrector: Correcter,
-       camera_buffer: Vec<u8>,
-       camera: Camera,
-       chunks: usize
-}
-
-impl ImageArray {
-       fn new (homography: [f64; 9]) -> Self {
-               let mut array = Self {
-                       data: vec![0u8; SPECTOGRAM_AREA * 3],
-                       homography,
-                       corrector: Correcter::new("./cube.npy"),
-
-                       camera_buffer: vec![0u8; IMAGE_AREA],
-                       camera: Camera::new("/dev/v4l/by-id/usb-MACROSILICON_USB_Video-video-index0").unwrap(), // should be video2
-
-                       chunks: SPECTOGRAM_AREA
-               };
-
-               array.camera.start(&Config {
-                       interval: (1, FPS as u32),
-                       resolution: (IMAGE_WIDTH as u32, IMAGE_HEIGHT as u32),
-                       format: b"RGB3",
-                       ..Default::default()
-               }).unwrap();
-               array
-       }
-
-       fn from_camera (&mut self) {
-               self.camera_buffer = self.camera.capture().unwrap()[..].try_into().expect("Image is wrong size");
-
-               unsafe{ApplyHomography (self.camera_buffer.as_ptr() as usize, self.data.as_ptr() as usize, self.homography.as_ptr() as usize);}
-
-               for i in 0..(self.data.len()-1)/3 {
-                       let mut r = self.data[i*3];
-                       let mut g = self.data[(i*3)+1];
-                       let mut b = self.data[(i*3)+3];
-
-                       [r, g, b] = self.corrector.correct(r, g, b);
-
-                       self.data[i*3] = r;
-                       self.data[(i*3)+1] = g;
-                       self.data[(i*3)+3] = b;
-               }
-       }
-
-       fn calibrate (&mut self) {
-               // rscam gives and empty image if its not prompted a couple times
-               for _i in 0..10 {
-                       self.camera_buffer = self.camera.capture().unwrap()[..].try_into().expect("Image is wrong size"); //delete assignment
-
-               }
-
-               // enter unsafe and get the homography array
-               unsafe {
-                       GetHomography(self.camera_buffer.as_ptr() as usize, self.homography.as_ptr() as usize);
-               }
-       }
-
-       fn from_buffer (&mut self, buffer: &Vec<Complex<f32>>) -> () {
-               let mut r: f32;
-               let mut theta: f32;
-               let mut amplitude: f32;
-
-               let mut hue: f32;
-               let mut angle: f32;
-
-               let mut d:f32;
-               let mut s:f32;
-               let mut v:f32;
-               let mut c:f32;
-               let mut m:f32;
-               let mut x:f32;
-               let mut g:f32;
-               let mut b:f32;
-
-               for i in 0..self.chunks {
-                       (r, theta) = buffer[i].to_polar();
-
-                       // make linear and normalize
-                       amplitude = 20f32 * r.log10();
-                       amplitude = ((amplitude - VOLUME_MIN) / (VOLUME_REL / AMPLITUDE_REL)) + AMPLITUDE_MIN;
-
-                       hue = (180f32 / 255f32) * amplitude;
-
-                       angle = (theta.to_degrees() + 180f32) * (ANGLE_REL / 360f32) + ANGLE_MIN;
-
-                       d = hue * (1f32 / 30f32);
-                       s = angle / 255f32;
-                       v = amplitude / 255f32;
-
-                       c = s * v;
-                       m = v - c;
-                       x = c * (1f32 - (d.rem_euclid(2f32) - 1f32).abs());
-
-                       (r, g, b) = match d.floor() {
-                               0.0 => (c, x, 0f32),
-                               1.0 => (x, c, 0f32),
-                               2.0 => (0f32, c, x),
-                               3.0 => (0f32, x, c),
-                               4.0 => (x, 0f32, c),
-                               _ => (c, 0f32, x)
-                       };
-
-                       self.data[i*3] = ((r + m) * 255f32) as u8;
-                       self.data[i*3+1] = ((g + m) * 255f32) as u8;
-                       self.data[i*3+2] = ((b + m) * 255f32) as u8;
-               }
-       }
-
-       fn to_buffer (&mut self, buffer: &mut Vec<Complex<f32>>) -> () {
-               let mut r: f32;
-               let mut amplitude: f32;
-
-               let mut angle: f32;
-
-               let mut s:f32;
-               let mut v:f32;
-               let mut c:f32;
-               let mut g:f32;
-               let mut b:f32;
-
-               for i in 0..self.chunks {
-                       r = self.data[i*3] as f32;
-                       g = self.data[i*3+1] as f32;
-                       b = self.data[i*3+2] as f32;
-
-                       v = r.max(g).max(b);
-                       c = (v - r.min(g).min(b)) * 255f32;
-                       s = if v == 0f32 { 0f32 } else { c / v };
-
-                       amplitude = (v - AMPLITUDE_MIN) * (VOLUME_REL / AMPLITUDE_REL) + VOLUME_MIN;
-
-                       amplitude = 10f32.powf(amplitude / 20f32);
-
-                       angle = (s - ANGLE_MIN) / (ANGLE_REL / 360f32) - 180f32;
-                       angle = angle.to_radians();
-
-                       buffer[i] = Complex::from_polar(amplitude, angle);
-               }
-       }
-}
-
-struct SampleBuffer {
-       buffer: Arc<Mutex<[i16; 2 * SPECTOGRAM_AREA]>>,
-       index: usize,
-       tx: Sender<bool>
-}
-
-impl SampleBuffer {
-       fn new(buffer: Arc<Mutex<[i16; 2 * SPECTOGRAM_AREA]>>, tx: Sender<bool>) -> Self {
-               Self {
-                       buffer,
-                       index: 0,
-                       tx
-               }
-       }
-
-       fn get_data(&mut self, data: &mut [i16]) {
-               let mut buffer = self.buffer.lock().unwrap();
-               let length = data.len()/2;
-
-               for i in 0..length {
-                       data[i*2] = buffer[i + self.index];
-               }
-
-               self.index += length;
-               if self.index > SPECTOGRAM_AREA {
-                       for i in 0..SPECTOGRAM_AREA {
-                               buffer[i] = buffer[i + SPECTOGRAM_AREA];
-                       }
-                       self.index -= SPECTOGRAM_AREA;
-
-                       let _ = self.tx.send(true);
-               }
-       }
+  fn ProcessCapture(camera_ptr: usize, buffer_ptr: usize, homography_ptr: usize, lut_ptr: usize);
 }
 
 #[show_image::main]
@@ -254,9 +79,12 @@ fn main () -> Result<(), Box<dyn std::error::Error>> {
        // create the debug window
        let debug_window = create_window("Debug", Default::default())?;
 
+       // get calibration image path
+       let calibration_path = RelativePath::new(CALIBRATION_PATH).as_str();
+
        // create window for displaying images and display calibration image
        let display_window = create_window("Display", Default::default())?;
-       let calibration_image = ImageReader::open("src/calibration.jpg")?.decode()?;
+       let calibration_image = ImageReader::open(calibration_path)?.decode()?;
        display_window.set_image("Display", calibration_image)?;
 
 
@@ -272,8 +100,11 @@ fn main () -> Result<(), Box<dyn std::error::Error>> {
        // calibrate camera
        image_array.calibrate();
 
+       // get audio path
+       let audio_path = RelativePath::new(AUDIO_PATH).as_str();
+
        // open audio file
-       let mut reader = hound::WavReader::open("/home/will/Downloads/asq.wav").unwrap();
+       let mut reader = hound::WavReader::open(audio_path).unwrap();
        let file_rate = reader.spec().sample_rate;
 
        // setup audio output and build output stream
diff --git a/src/perspective.cpp b/src/perspective.cpp
deleted file mode 100644 (file)
index 449bfbb..0000000
+++ /dev/null
@@ -1,121 +0,0 @@
-// g++ ./perspective.cpp -I/usr/share/include/opencv4/ -lopencv_core -lopencv_calib3d -lopencv_highgui -lopencv_xfeatures2d -lopencv_features2d -lopencv_imgproc -lopencv_videoio -lopencv_imgcodecs -lopencv_features2d -o perspective.a
-//
-#include "opencv4/opencv2/core.hpp"
-#include "opencv4/opencv2/highgui.hpp"
-#include "opencv4/opencv2/xfeatures2d.hpp"
-#include "opencv4/opencv2/calib3d.hpp"
-#include "opencv4/opencv2/imgproc.hpp"
-
-#ifdef CUDA
-#include "opencv4/opencv2/cudawarping.hpp"
-#endif
-
-using namespace cv;
-using namespace cv::xfeatures2d;
-
-const size_t WINDOW_SIZE = 128;
-const size_t CHUNK_SIZE = 72;
-const size_t SPECTOGRAM_AREA = WINDOW_SIZE * CHUNK_SIZE;
-const int FLAT_AREA = SPECTOGRAM_AREA * 3;
-const Size DSIZE_AREA = Size(WINDOW_SIZE, CHUNK_SIZE);
-
-const size_t IMAGE_WIDTH = 1920;
-const size_t IMAGE_HEIGHT = 1080;
-
-extern "C"
-{
-       void GetHomography(uint8_t *camera_ptr, double *homography_ptr)
-       {
-               try
-               {
-                       Mat img1 = imread( samples::findFile("src/calibration.jpg")/*, IMREAD_GRAYSCALE */);
-                       Mat img2(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
-
-                       // detect keypoints and compute descriptors
-                       int minHessian = 400;
-                       Ptr<SURF> detector = SURF::create( minHessian );
-
-                       std::vector<KeyPoint> keypoints1, keypoints2;
-                       Mat descriptors1, descriptors2;
-                       detector->detectAndCompute( img1, noArray(), keypoints1, descriptors1 );
-                       detector->detectAndCompute( img2, noArray(), keypoints2, descriptors2 );
-
-                       // match descriptors
-                       Ptr<DescriptorMatcher> matcher = DescriptorMatcher::create(DescriptorMatcher::FLANNBASED);
-                       std::vector< std::vector<DMatch> > knn_matches;
-
-                       matcher->knnMatch( descriptors1, descriptors2, knn_matches, 2 );
-
-                       // filter matches by the ratio test
-                       const float ratio_thresh = 0.7f;
-                       std::vector<DMatch> good_matches;
-                       for (size_t i = 0; i < knn_matches.size(); i++)
-                       {
-                               if (knn_matches[i][0].distance < ratio_thresh * knn_matches[i][1].distance)
-                               {
-                                       good_matches.push_back(knn_matches[i][0]);
-                               }
-                       }
-
-                       // get the source and destination points
-                       std::vector<Point2f> source_points, dst_points;
-                       for (size_t i = 0; i < good_matches.size(); i++)
-                       {
-                               Point2f s_point = keypoints2[good_matches[i].trainIdx].pt;
-                               Point2f d_point = keypoints1[good_matches[i].queryIdx].pt;
-                               source_points.push_back(s_point);
-                               dst_points.push_back(d_point);
-                       }
-
-                       // perform homography
-                       double ransac_thresh = 5.0f;
-                       Mat homography = findHomography(source_points, dst_points, RANSAC, ransac_thresh);
-
-                       // copy the result to the homography location
-                       const double* result_ptr = homography.ptr<double>(0);
-                       std::memcpy(homography_ptr, result_ptr, 72); // size of [f64; 9]
-               }
-               catch (const std::exception &e) // handle exceptions for rust
-               {
-                       std::cout << "Exception " << e.what() << std::endl;
-               }
-       }
-
-               void ApplyHomography(uint8_t *camera_ptr, uint8_t *buffer_ptr, double *homography_ptr)
-               {
-                       Mat capture(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
-                       Mat buffer(CHUNK_SIZE, WINDOW_SIZE, CV_8UC3, buffer_ptr);
-                       Mat homography(3, 3, CV_64F, homography_ptr);
-
-                       warpPerspective(capture, capture, homography, capture.size());
-                       resize(capture, buffer, buffer.size());
-               }
-
-               void ApplyUndistort(uint8_t *camera_ptr, float *xmat_ptr, float *ymat_ptr)
-               {
-                       Mat xmat (IMAGE_HEIGHT, IMAGE_WIDTH, CV_32F, xmat_ptr);
-                       Mat ymat (IMAGE_HEIGHT, IMAGE_WIDTH, CV_32F, ymat_ptr);
-
-                       Mat capture(IMAGE_HEIGHT, IMAGE_WIDTH, CV_8UC3, camera_ptr);
-                       Mat buffer = capture.clone();
-
-/* This wont work because the Mats have to be GpuMats, since we're getting a
- * pointer for them, it might be better to move it all over onto the gpu and
- * then do the warp transform all at the same time.
- *
- * This might be a bit messy.
- *
- * Also if im writing CUDA code in cpp and then moving between rust and cpp it
- * might just be easier to make a lot of the color stuff in rust. Question is is
- * it more efficient to just do it on the CPU or move it over to the GPU and
- * then do it there...
- */
-
-#ifdef CUDA
-                       cv::cuda::remap(buffer, capture, xmat, ymat, INTER_NEAREST);
-#else
-                       remap(buffer, capture, xmat, ymat, INTER_NEAREST);
-#endif
-               }
-}
-
diff --git a/src/process.cpp b/src/process.cpp
new file mode 100644 (file)
index 0000000..178dfb1
--- /dev/null
@@ -0,0 +1,34 @@
+#include "barrel.cpp"
+#include "homography.cpp"
+#include "color.cpp"
+
+extern "C"
+{
+       void ProcessCapture(uint8_t *camera_ptr, uint8_t *buffer_ptr, double *homography_ptr, uint8_t *lut_ptr)
+       {
+               /*
+                * Here's the plan:
+                *
+                * We take the image from the camera buffer,
+                * apply the homography to undistort it,
+                * apply the LUT to color correct it,
+                * and do the FFT to turn it into audio.
+                *
+                * This is a lot of new code to write rather than just refactoring old
+                * code, but it will let us talk to the GPU more easily and keep
+                * things in one place.
+                *
+                * It also means that we can compile with explicit CUDA support without
+                * even thinking about it in the Rust code.
+                */
+
+               ApplyHomography(camera_ptr, buffer_ptr, homography_ptr);
+               //ApplyCorrection(buffer_ptr, lut_ptr);
+       }
+
+       // get homography function (see "homography.cpp")
+       void GetHomography(uint8_t *camera_ptr, double *homography_ptr)
+       {
+               FuncGetHomography(camera_ptr, homography_ptr);
+       }
+}
diff --git a/src/sample_buffer.rs b/src/sample_buffer.rs
new file mode 100644 (file)
index 0000000..d808f82
--- /dev/null
@@ -0,0 +1,39 @@
+use std::sync::mpsc::Sender;
+use std::sync::{Arc, Mutex};
+
+use crate::SPECTOGRAM_AREA;
+
+pub struct SampleBuffer {
+       buffer: Arc<Mutex<[i16; 2 * SPECTOGRAM_AREA]>>,
+       index: usize,
+       tx: Sender<bool>
+}
+
+impl SampleBuffer {
+       pub fn new(buffer: Arc<Mutex<[i16; 2 * SPECTOGRAM_AREA]>>, tx: Sender<bool>) -> Self {
+               Self {
+                       buffer,
+                       index: 0,
+                       tx
+               }
+       }
+
+       pub fn get_data(&mut self, data: &mut [i16]) {
+               let mut buffer = self.buffer.lock().unwrap();
+               let length = data.len()/2;
+
+               for i in 0..length {
+                       data[i*2] = buffer[i + self.index];
+               }
+
+               self.index += length;
+               if self.index > SPECTOGRAM_AREA {
+                       for i in 0..SPECTOGRAM_AREA {
+                               buffer[i] = buffer[i + SPECTOGRAM_AREA];
+                       }
+                       self.index -= SPECTOGRAM_AREA;
+
+                       let _ = self.tx.send(true);
+               }
+       }
+}
diff --git a/test/example.wav b/test/example.wav
new file mode 100644 (file)
index 0000000..02c44de
Binary files /dev/null and b/test/example.wav differ
diff --git a/todo b/todo
index d66b84c90623a385be57ec7bb8372ac100c438da..f88857ff2bc9f3a2f536d8b5fda53fbc04fc058e 100644 (file)
--- a/todo
+++ b/todo
@@ -1,15 +1,36 @@
 todo:
-- make calibrator for casts on the image
-       - could do this with HSV, i suspect that if we graph changes in HS across
-       the surface of the image, we would see the casts, if they collate with each
-       other then the new "LUT" is x,y,H. this should be simple to build into the
-       current LUT system
-
 - test the lut system in-situ, graph for optimal
-- make the LUT corrector (rust) more efficient (multithreading?)
 - possibly see if a version can be made that takes mic input
 - implement recording for testing
 - implement image display in unused channel
 
 - write cpp code for using cuFFT (not supported by rust-cuda)
 - potentially write rust-cuda kernel for the color conversion
+
+QUICKLY:
+- make functional with windows
+       - some things that might not be windows compatible:
+               - show-image (YES but might need to mess with the backend)
+               - hound for reading the wav files (YES)
+               - cpal for the audio out (YES look into asio extra feature for lower latency)
+               - rscam for the camera (NO drop in for nokhwa) (IMPLEMENTED)
+               - the file paths (IMPLEMENTED)
+- evaluate if cuda is necessary
+
+LIBRARIES:
+- FFTW (https://www.fftw.org/fftw3_doc/) for the c++
+- nokhwa (IMPLEMENTED)
+- fon
+- rayon
+
+LATENCY:
+- cpal asio
+- reduce the image size
+- gpu support for the c++ code
+
+GPU PERFORMANCE ISSUES:
+- bring down show_image env flag
+
+CAPTURE ISSUES:
+- check nokhwa fps, res, etc
+- reinstate the read loop