parent
b34b1e630b
commit
520fbcf317
@ -0,0 +1,141 @@
|
|||||||
|
use std::io::Write;
|
||||||
|
|
||||||
|
use nalgebra::{dvector, DVector};
|
||||||
|
use neuramethyst::derivable::activation::Linear;
|
||||||
|
use neuramethyst::derivable::loss::CrossEntropy;
|
||||||
|
use neuramethyst::derivable::regularize::NeuraL1;
|
||||||
|
use neuramethyst::{plot_losses, prelude::*};
|
||||||
|
|
||||||
|
use rand::Rng;
|
||||||
|
|
||||||
|
fn main() {
|
||||||
|
let mut network = neura_residual![
|
||||||
|
<= 0, 2;
|
||||||
|
neura_layer!("dense", 4).regularization(NeuraL1(0.001));
|
||||||
|
neura_layer!("dropout", 0.25);
|
||||||
|
neura_layer!("dense", 2)
|
||||||
|
.activation(Linear)
|
||||||
|
.regularization(NeuraL1(0.001));
|
||||||
|
neura_layer!("softmax");
|
||||||
|
]
|
||||||
|
.construct(NeuraShape::Vector(2))
|
||||||
|
.unwrap();
|
||||||
|
|
||||||
|
let inputs = (0..1).cycle().map(move |_| {
|
||||||
|
let mut rng = rand::thread_rng();
|
||||||
|
let category = rng.gen_bool(0.5) as usize;
|
||||||
|
let (x, y) = if category == 0 {
|
||||||
|
let radius: f32 = rng.gen_range(0.0..2.0);
|
||||||
|
let angle = rng.gen_range(0.0..std::f32::consts::TAU);
|
||||||
|
(angle.cos() * radius, angle.sin() * radius)
|
||||||
|
} else {
|
||||||
|
let radius: f32 = rng.gen_range(3.0..5.0);
|
||||||
|
let angle = rng.gen_range(0.0..std::f32::consts::TAU);
|
||||||
|
(angle.cos() * radius, angle.sin() * radius)
|
||||||
|
};
|
||||||
|
|
||||||
|
(dvector![x, y], one_hot(category, 2))
|
||||||
|
});
|
||||||
|
|
||||||
|
let test_inputs: Vec<_> = inputs.clone().take(10).collect();
|
||||||
|
|
||||||
|
if std::env::args().any(|arg| arg == "draw") {
|
||||||
|
for epoch in 0..200 {
|
||||||
|
let mut trainer = NeuraBatchedTrainer::new(0.03, 10);
|
||||||
|
trainer.batch_size = 10;
|
||||||
|
|
||||||
|
trainer.train(
|
||||||
|
&NeuraBackprop::new(CrossEntropy),
|
||||||
|
&mut network,
|
||||||
|
inputs.clone(),
|
||||||
|
&test_inputs,
|
||||||
|
);
|
||||||
|
|
||||||
|
draw_neuron_activation(
|
||||||
|
|input| {
|
||||||
|
let output = network.eval(&dvector![input[0] as f32, input[1] as f32]);
|
||||||
|
let estimation = output[0] / (output[0] + output[1]);
|
||||||
|
|
||||||
|
let color = network.eval(&dvector![input[0] as f32, input[1] as f32]);
|
||||||
|
|
||||||
|
(&color / color.map(|x| x * x).sum() * estimation)
|
||||||
|
.into_iter()
|
||||||
|
.map(|x| x.abs() as f64)
|
||||||
|
.collect::<Vec<_>>()
|
||||||
|
},
|
||||||
|
6.0,
|
||||||
|
);
|
||||||
|
println!("{}", epoch);
|
||||||
|
|
||||||
|
std::thread::sleep(std::time::Duration::new(0, 50_000_000));
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
let mut trainer = NeuraBatchedTrainer::new(0.03, 20 * 50);
|
||||||
|
trainer.batch_size = 10;
|
||||||
|
trainer.log_iterations = 20;
|
||||||
|
|
||||||
|
plot_losses(
|
||||||
|
trainer.train(
|
||||||
|
&NeuraBackprop::new(CrossEntropy),
|
||||||
|
&mut network,
|
||||||
|
inputs.clone(),
|
||||||
|
&test_inputs,
|
||||||
|
),
|
||||||
|
128,
|
||||||
|
48,
|
||||||
|
);
|
||||||
|
|
||||||
|
// println!("{}", String::from("\n").repeat(64));
|
||||||
|
// draw_neuron_activation(|input| network.eval(&input).into_iter().collect(), 6.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
let mut file = std::fs::File::create("target/bivariate.csv").unwrap();
|
||||||
|
for (input, _target) in test_inputs {
|
||||||
|
let guess = neuramethyst::argmax(network.eval(&input).as_slice());
|
||||||
|
writeln!(&mut file, "{},{},{}", input[0], input[1], guess).unwrap();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// TODO: move this to the library?
|
||||||
|
fn draw_neuron_activation<F: Fn([f64; 2]) -> Vec<f64>>(callback: F, scale: f64) {
|
||||||
|
use viuer::Config;
|
||||||
|
|
||||||
|
const WIDTH: u32 = 64;
|
||||||
|
const HEIGHT: u32 = 64;
|
||||||
|
|
||||||
|
let mut image = image::RgbImage::new(WIDTH, HEIGHT);
|
||||||
|
|
||||||
|
fn sigmoid(x: f64) -> f64 {
|
||||||
|
1.9 / (1.0 + (-x * 3.0).exp()) - 0.9
|
||||||
|
}
|
||||||
|
|
||||||
|
for y in 0..HEIGHT {
|
||||||
|
let y2 = 2.0 * y as f64 / HEIGHT as f64 - 1.0;
|
||||||
|
for x in 0..WIDTH {
|
||||||
|
let x2 = 2.0 * x as f64 / WIDTH as f64 - 1.0;
|
||||||
|
let activation = callback([x2 * scale, y2 * scale]);
|
||||||
|
let r = (sigmoid(activation.get(0).copied().unwrap_or(-1.0)) * 255.0).floor() as u8;
|
||||||
|
let g = (sigmoid(activation.get(1).copied().unwrap_or(-1.0)) * 255.0).floor() as u8;
|
||||||
|
let b = (sigmoid(activation.get(2).copied().unwrap_or(-1.0)) * 255.0).floor() as u8;
|
||||||
|
|
||||||
|
*image.get_pixel_mut(x, y) = image::Rgb([r, g, b]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let config = Config {
|
||||||
|
use_kitty: false,
|
||||||
|
truecolor: true,
|
||||||
|
// absolute_offset: false,
|
||||||
|
..Default::default()
|
||||||
|
};
|
||||||
|
|
||||||
|
viuer::print(&image::DynamicImage::ImageRgb8(image), &config).unwrap();
|
||||||
|
}
|
||||||
|
|
||||||
|
fn one_hot(value: usize, categories: usize) -> DVector<f32> {
|
||||||
|
let mut res = DVector::from_element(categories, 0.0);
|
||||||
|
if value < categories {
|
||||||
|
res[value] = 1.0;
|
||||||
|
}
|
||||||
|
res
|
||||||
|
}
|
@ -0,0 +1,176 @@
|
|||||||
|
use crate::layer::*;
|
||||||
|
use crate::network::*;
|
||||||
|
use crate::utils::unwrap_or_clone;
|
||||||
|
|
||||||
|
use std::borrow::Cow;
|
||||||
|
|
||||||
|
use super::construct::*;
|
||||||
|
use super::*;
|
||||||
|
|
||||||
|
#[derive(Clone, Debug, PartialEq)]
|
||||||
|
pub struct NeuraResidualLast {
|
||||||
|
output_shape: Option<NeuraShape>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl NeuraResidualLast {
|
||||||
|
#[inline(always)]
|
||||||
|
pub fn new() -> Self {
|
||||||
|
Self { output_shape: None }
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for NeuraResidualLast {
|
||||||
|
#[inline(always)]
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl NeuraResidualConstruct for NeuraResidualLast {
|
||||||
|
type Constructed = NeuraResidualLast;
|
||||||
|
type Err = NeuraResidualConstructErr<(), ()>;
|
||||||
|
|
||||||
|
fn construct_residual(
|
||||||
|
self,
|
||||||
|
input: NeuraResidualInput<NeuraShape>,
|
||||||
|
) -> Result<Self::Constructed, Self::Err> {
|
||||||
|
let input = *input
|
||||||
|
.get_first()
|
||||||
|
.ok_or(Self::Err::AxisErr(NeuraAxisErr::NoInput))?;
|
||||||
|
|
||||||
|
Ok(Self {
|
||||||
|
output_shape: Some(input),
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl NeuraShapedLayer for NeuraResidualLast {
|
||||||
|
fn output_shape(&self) -> NeuraShape {
|
||||||
|
self.output_shape
|
||||||
|
.expect("Called NeuraResidualLast::output_shape before constructing it")
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl NeuraNetworkBase for NeuraResidualLast {
    /// The unit type stands in for the layer of this node.
    type Layer = ();

    /// Returns a reference to the unit value used as this node's layer.
    #[inline(always)]
    fn get_layer(&self) -> &() {
        &()
    }
}
|
||||||
|
|
||||||
|
impl NeuraNetworkRec for NeuraResidualLast {
|
||||||
|
type NextNode = ();
|
||||||
|
|
||||||
|
#[inline(always)]
|
||||||
|
fn get_next(&self) -> &Self::NextNode {
|
||||||
|
&()
|
||||||
|
}
|
||||||
|
|
||||||
|
fn merge_gradient(
|
||||||
|
&self,
|
||||||
|
rec_gradient: <Self::NextNode as NeuraTrainableLayerBase>::Gradient,
|
||||||
|
layer_gradient: <Self::Layer as NeuraTrainableLayerBase>::Gradient,
|
||||||
|
) -> Self::Gradient
|
||||||
|
where
|
||||||
|
Self::Layer: NeuraTrainableLayerBase,
|
||||||
|
{
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl<Data: Clone> NeuraNetwork<NeuraResidualInput<Data>> for NeuraResidualLast {
|
||||||
|
type LayerInput = Data;
|
||||||
|
|
||||||
|
type NodeOutput = Data;
|
||||||
|
|
||||||
|
fn map_input<'a>(&'_ self, input: &'a NeuraResidualInput<Data>) -> Cow<'a, Self::LayerInput> {
|
||||||
|
Cow::Owned(unwrap_or_clone(input.clone().get_first().unwrap()))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn map_output<'a>(
|
||||||
|
&'_ self,
|
||||||
|
_input: &'_ NeuraResidualInput<Data>,
|
||||||
|
layer_output: &'a Data,
|
||||||
|
) -> Cow<'a, Self::NodeOutput> {
|
||||||
|
Cow::Borrowed(layer_output)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn map_gradient_in<'a>(
|
||||||
|
&'_ self,
|
||||||
|
_input: &'_ NeuraResidualInput<Data>,
|
||||||
|
gradient_in: &'a Self::NodeOutput,
|
||||||
|
) -> Cow<'a, <Self::Layer as NeuraLayer<Self::LayerInput>>::Output> {
|
||||||
|
Cow::Borrowed(gradient_in)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn map_gradient_out<'a>(
|
||||||
|
&'_ self,
|
||||||
|
input: &'_ NeuraResidualInput<Data>,
|
||||||
|
gradient_in: &'_ Self::NodeOutput,
|
||||||
|
gradient_out: &'a Self::LayerInput,
|
||||||
|
) -> Cow<'a, NeuraResidualInput<Data>> {
|
||||||
|
unimplemented!()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl NeuraTrainableLayerBase for NeuraResidualLast {
    /// The gradient of this node is the unit type.
    type Gradient = ();

    /// Returns the unit gradient.
    #[inline(always)]
    fn default_gradient(&self) -> Self::Gradient {}

    /// Does nothing: applying a unit gradient leaves the node unchanged.
    #[inline(always)]
    fn apply_gradient(&mut self, _gradient: &Self::Gradient) {}
}
|
||||||
|
|
||||||
|
impl<Data: Clone> NeuraLayer<NeuraResidualInput<Data>> for NeuraResidualLast {
|
||||||
|
type Output = Data;
|
||||||
|
|
||||||
|
fn eval(&self, input: &NeuraResidualInput<Data>) -> Self::Output {
|
||||||
|
let result: Rc<Self::Output> = input.clone().get_first()
|
||||||
|
.expect("Invalid NeuraResidual state: network returned no data, did you forget to link the last layer?")
|
||||||
|
.into();
|
||||||
|
|
||||||
|
unwrap_or_clone(result)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl<Data: Clone> NeuraTrainableLayerEval<NeuraResidualInput<Data>> for NeuraResidualLast {
    /// No intermediary data is kept between evaluation and backpropagation.
    type IntermediaryRepr = ();

    /// Evaluates the node exactly like `eval`, paired with the unit intermediary value.
    #[inline(always)]
    fn eval_training(
        &self,
        input: &NeuraResidualInput<Data>,
    ) -> (Self::Output, Self::IntermediaryRepr) {
        let output = self.eval(input);
        (output, ())
    }
}
|
||||||
|
|
||||||
|
impl<Data: Clone> NeuraTrainableLayerSelf<NeuraResidualInput<Data>> for NeuraResidualLast {
    /// Returns the unit gradient.
    #[inline(always)]
    fn regularize_layer(&self) -> Self::Gradient {}

    /// Returns the unit gradient, ignoring every argument.
    #[inline(always)]
    fn get_gradient(
        &self,
        _input: &NeuraResidualInput<Data>,
        _intermediary: &Self::IntermediaryRepr,
        _epsilon: &Self::Output,
    ) -> Self::Gradient {
    }
}
|
||||||
|
|
||||||
|
// let epsilon = Rc::new(epsilon.clone());
|
||||||
|
// let mut epsilon_residual = NeuraResidualInput::new();
|
||||||
|
|
||||||
|
// epsilon_residual.push(0, epsilon);
|
@ -1,11 +1,59 @@
|
|||||||
//! Implementations for NeuraLayer*
|
use nalgebra::{DVector, Scalar};
|
||||||
|
use num::Float;
|
||||||
use std::borrow::Cow;
|
use std::borrow::Cow;
|
||||||
|
|
||||||
use crate::network::*;
|
use crate::network::*;
|
||||||
|
|
||||||
use super::*;
|
use super::*;
|
||||||
|
|
||||||
impl<Axis, Layer, ChildNetwork> NeuraResidualNode<Layer, ChildNetwork, Axis> {
|
#[derive(Clone, Debug, PartialEq)]
|
||||||
|
pub struct NeuraResidualNode<Layer, ChildNetwork, Axis> {
|
||||||
|
pub layer: Layer,
|
||||||
|
pub child_network: ChildNetwork,
|
||||||
|
|
||||||
|
/// Array of relative layers indices to send the offset of this layer to,
|
||||||
|
/// defaults to `vec![0]`.
|
||||||
|
pub(crate) offsets: Vec<usize>,
|
||||||
|
|
||||||
|
pub axis: Axis,
|
||||||
|
|
||||||
|
pub(crate) output_shape: Option<NeuraShape>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl<Layer, ChildNetwork> NeuraResidualNode<Layer, ChildNetwork, NeuraAxisAppend> {
|
||||||
|
pub fn new(layer: Layer, child_network: ChildNetwork) -> Self {
|
||||||
|
Self {
|
||||||
|
layer,
|
||||||
|
child_network,
|
||||||
|
offsets: vec![0],
|
||||||
|
axis: NeuraAxisAppend,
|
||||||
|
output_shape: None,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl<Layer, ChildNetwork, Axis> NeuraResidualNode<Layer, ChildNetwork, Axis> {
|
||||||
|
pub fn offsets(mut self, offsets: Vec<usize>) -> Self {
|
||||||
|
self.offsets = offsets;
|
||||||
|
self
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn offset(mut self, offset: usize) -> Self {
|
||||||
|
self.offsets.push(offset);
|
||||||
|
self
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn axis<Axis2>(self, axis: Axis2) -> NeuraResidualNode<Layer, ChildNetwork, Axis2> {
|
||||||
|
NeuraResidualNode {
|
||||||
|
layer: self.layer,
|
||||||
|
child_network: self.child_network,
|
||||||
|
offsets: self.offsets,
|
||||||
|
axis,
|
||||||
|
// Drop the knowledge of output_shape
|
||||||
|
output_shape: None,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
fn process_input<Data>(
|
fn process_input<Data>(
|
||||||
&self,
|
&self,
|
||||||
input: &NeuraResidualInput<Data>,
|
input: &NeuraResidualInput<Data>,
|
Loading…
Reference in new issue