chalkydri/subsys/
capriltags.rs

1//!
2//! Subsystem for the official AprilTags C library
3//!
4
5// TODO: implement this
6// There's actually already a decent Rust binding we can use.
7// There's an example here: <https://github.com/jerry73204/apriltag-rust/blob/master/apriltag/examples/detector.rs>
8//
9// <https://www.chiefdelphi.com/t/frc-blog-technology-updates-past-present-future-and-beyond-apriltags-and-new-radio/440931>
10// According to this post on CD, we're doing the 36h11 tag family now.
11
12use std::collections::HashMap;
13
14use apriltag::{Detector, Family, Image, TagParams};
15use camera_intrinsic_model::{GenericModel, OpenCVModel5};
16use gstreamer::ElementFactory;
17use gstreamer::prelude::GstBinExtManual;
18use gstreamer::{Buffer, Caps, Element};
19use minint::NtConn;
20use rapier3d::math::{Matrix, Rotation, Translation};
21use rapier3d::na::Quaternion;
22#[cfg(feature = "rerun")]
23use re_sdk::external::re_types_core;
24#[cfg(feature = "rerun")]
25use re_types::{
26    archetypes::{Boxes2D, Points2D},
27    components::{PinholeProjection, PoseRotationQuat, Position2D, ViewCoordinates},
28};
29use std::time::Instant;
30use tokio::sync::watch;
31
32use crate::Cfg;
33use crate::calibration::CalibratedModel;
34use crate::{Subsystem, config, subsystem::frame_proc_loop};
35
36const TAG_SIZE: f64 = 0.1651;
37
38pub struct CApriltagsDetector {
39    det: apriltag::Detector,
40    layout: HashMap<u64, (Translation<f64>, Rotation<f64>)>,
41    model: CalibratedModel,
42    name: String,
43}
44impl Subsystem for CApriltagsDetector {
45    const NAME: &'static str = "capriltags";
46
47    type Config = config::CAprilTagsSubsys;
48    type Output = ();
49    type Error = Box<dyn std::error::Error + Send>;
50
51    fn preproc(
52        cam_config: config::Camera,
53        pipeline: &gstreamer::Pipeline,
54    ) -> Result<(gstreamer::Element, gstreamer::Element), Self::Error> {
55        let config = cam_config.subsystems.capriltags;
56        // The AprilTag preprocessing part:
57        //  tee ! gamma ! videoconvertscale ! capsfilter ! appsink
58
59        // Create the elements
60        let videoconvertscale = ElementFactory::make("videoconvertscale").build().unwrap();
61        let filter = ElementFactory::make("capsfilter")
62            .property(
63                "caps",
64                &Caps::builder("video/x-raw")
65                    .field("width", &1280)
66                    .field("height", &720)
67                    .field("format", "GRAY8")
68                    .build(),
69            )
70            .build()
71            .unwrap();
72
73        // Add them to the pipeline
74        pipeline.add_many([&videoconvertscale, &filter]).unwrap();
75
76        // Link them
77        Element::link_many([&videoconvertscale, &filter]).unwrap();
78
79        Ok((videoconvertscale, filter))
80    }
81    async fn init(cam_config: config::Camera) -> Result<Self, Self::Error> {
82        let model = CalibratedModel::new(cam_config.calib.unwrap());
83
84        let subsys_cfg = cam_config.subsystems.capriltags;
85        let default_layout = AprilTagFieldLayout {
86            tags: Vec::new(),
87            field: Field {
88                width: 0.0,
89                length: 0.0,
90            },
91        };
92        let layouts = Cfg.read().await.field_layouts.clone().unwrap();
93        let layout = layouts
94            .get(&subsys_cfg.field_layout.unwrap_or_default())
95            .unwrap_or(&default_layout);
96        let layout = AprilTagFieldLayout::load(layout);
97        let det = Detector::builder()
98            .add_family_bits(Family::tag_36h11(), 3)
99            .build()
100            .unwrap();
101
102        Ok(Self {
103            model,
104            layout,
105            det,
106            name: cam_config.id,
107        })
108    }
109    async fn process(
110        &mut self,
111        nt: NtConn,
112        rx: watch::Receiver<Option<Buffer>>,
113    ) -> Result<Self::Output, Self::Error> {
114        let cam_name = self.name.clone();
115
116        // Publish NT topics we'll use
117        let mut translation = nt
118            .publish::<Vec<f64>>(&format!("/chalkydri/robot_pose/{cam_name}/translation"))
119            .await
120            .unwrap();
121        let mut rotation = nt
122            .publish::<Vec<f64>>(&format!("/chalkydri/robot_pose/{cam_name}/rotation"))
123            .await
124            .unwrap();
125        let mut delay = nt
126            .publish::<f64>(&format!("/chalkydri/robot_pose/{cam_name}/delay"))
127            .await
128            .unwrap();
129        let mut tag_detected = nt
130            .publish::<bool>(&format!("/chalkydri/robot_pose/{cam_name}/tag_detected"))
131            .await
132            .unwrap();
133
134        debug!("running frame processing loop...");
135        frame_proc_loop(rx, async |frame| {
136            let proc_st_time = Instant::now();
137
138            if let Ok(buf) = frame.into_mapped_buffer_readable() {
139                debug!("loading image...");
140                let img = unsafe { Image::from_luma8(1280, 720, buf.as_ptr() as *mut _).unwrap() };
141
142                let dets = self.det.detect(&img);
143
144                let poses: Vec<_> = dets
145                    .iter()
146                    .filter_map(|det| {
147                        // Extract camera calibration values from the [CalibratedModel]
148                        let OpenCVModel5 { fx, fy, cx, cy, .. } =
149                            if let GenericModel::OpenCVModel5(model) = self.model.inner_model() {
150                                model
151                            } else {
152                                panic!("camera model type not supported yet");
153                            };
154
155                        // Estimate tag pose with the camera calibration values
156                        let pose = det
157                            .estimate_tag_pose(&TagParams {
158                                fx,
159                                fy,
160                                cx,
161                                cy,
162                                tagsize: TAG_SIZE,
163                            })
164                            .unwrap();
165
166                        // Extract the camera's translation and rotation matrices from the [Pose]
167                        let cam_translation = pose.translation().data().to_vec();
168                        let cam_rotation = pose.rotation().data().to_vec();
169
170                        // Convert the camera's translation and rotation matrices into proper Rust datatypes
171                        let cam_translation = Translation::new(
172                            cam_translation[0],
173                            cam_translation[1],
174                            cam_translation[2],
175                        );
176                        let cam_rotation = Rotation::from_matrix(&Matrix::from_vec(cam_rotation));
177
178                        debug!(
179                            "detected tag id {}: tl={cam_translation} ro={cam_rotation}",
180                            det.id()
181                        );
182
183                        // Try to get the tag's pose from the field layout
184                        if let Some((tag_translation, tag_rotation)) =
185                            self.layout.get(&(det.id() as u64))
186                        {
187                            let translation = tag_translation * cam_translation;
188                            let rotation = tag_rotation * cam_rotation;
189                            return Some((translation, rotation, det.decision_margin() as f64));
190                        }
191
192                        None
193                    })
194                    .collect();
195
196                if poses.len() > 0 {
197                    let mut avg_translation = Translation::new(0.0f64, 0.0, 0.0);
198                    let mut avg_rotation = Quaternion::new(0.0f64, 0.0, 0.0, 0.0);
199
200                    for pose in poses.iter() {
201                        avg_translation.x += pose.0.x;
202                        avg_translation.y += pose.0.y;
203                        avg_translation.z += pose.0.z;
204
205                        avg_rotation.w += pose.1.w;
206                        avg_rotation.i += pose.1.i;
207                        avg_rotation.j += pose.1.j;
208                        avg_rotation.k += pose.1.k;
209                    }
210
211                    avg_translation.x /= poses.len() as f64;
212                    avg_translation.x /= poses.len() as f64;
213                    avg_translation.x /= poses.len() as f64;
214
215                    avg_rotation.w /= poses.len() as f64;
216                    avg_rotation.i /= poses.len() as f64;
217                    avg_rotation.j /= poses.len() as f64;
218                    avg_rotation.k /= poses.len() as f64;
219
220                    let t = avg_translation.vector.data.as_slice().to_vec();
221                    let r = avg_rotation.vector().data.into_slice().to_vec();
222
223                    debug!("tag detected : {t:?} / {r:?}");
224
225                    translation.set(t).await;
226                    rotation.set(r).await;
227                    tag_detected.set(true).await;
228                    delay.set(proc_st_time.elapsed().as_millis_f64()).await;
229                } else {
230                    debug!("no tag detected");
231                    tag_detected.set(false).await;
232                }
233            }
234        })
235        .await;
236        debug!("loop done?");
237
238        Ok(())
239    }
240}
241
242#[derive(Default, Debug, Clone, PartialEq, Serialize, Deserialize)]
243#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
244#[serde(rename_all = "camelCase")]
245pub struct AprilTagFieldLayout {
246    pub tags: Vec<LayoutTag>,
247    pub field: Field,
248}
249impl AprilTagFieldLayout {
250    pub fn load(&self) -> HashMap<u64, (Translation<f64>, Rotation<f64>)> {
251        let mut tags = HashMap::new();
252        for LayoutTag {
253            id,
254            pose:
255                LayoutPose {
256                    translation,
257                    rotation: LayoutRotation { quaternion },
258                },
259        } in self.tags.clone()
260        {
261            // Turn the field layout values into Rust datatypes
262            let tag_translation = Translation::new(translation.x, translation.y, translation.z);
263            let tag_rotation = Rotation::from_quaternion(Quaternion::new(
264                quaternion.w,
265                quaternion.x,
266                quaternion.y,
267                quaternion.z,
268            ));
269
270            tags.insert(id as u64, (tag_translation, tag_rotation));
271        }
272
273        tags
274    }
275}
276
277#[derive(Default, Debug, Clone, PartialEq, Serialize, Deserialize)]
278#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
279#[serde(rename_all = "camelCase")]
280pub struct LayoutTag {
281    #[serde(rename = "ID")]
282    pub id: i64,
283    pub pose: LayoutPose,
284}
285
286#[derive(Default, Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
287#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
288#[serde(rename_all = "camelCase")]
289pub struct LayoutPose {
290    pub translation: LayoutTranslation,
291    pub rotation: LayoutRotation,
292}
293
294#[derive(Default, Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
295#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
296#[serde(rename_all = "camelCase")]
297pub struct LayoutTranslation {
298    pub x: f64,
299    pub y: f64,
300    pub z: f64,
301}
302
303#[derive(Default, Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
304#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
305#[serde(rename_all = "camelCase")]
306pub struct LayoutRotation {
307    pub quaternion: LayoutQuaternion,
308}
309
310#[derive(Default, Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
311#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
312#[serde(rename_all = "camelCase")]
313pub struct LayoutQuaternion {
314    #[serde(rename = "W")]
315    pub w: f64,
316    #[serde(rename = "X")]
317    pub x: f64,
318    #[serde(rename = "Y")]
319    pub y: f64,
320    #[serde(rename = "Z")]
321    pub z: f64,
322}
323
324#[derive(Default, Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
325#[cfg_attr(feature = "web", derive(utopia::ToSchema))]
326#[serde(rename_all = "camelCase")]
327pub struct Field {
328    pub length: f64,
329    pub width: f64,
330}