Name: cli-music
Author: rawgroundbeef

cli-music | Skills Pool

# Quick recipe: render a 60 s loop (pad + bass + kick + noise bed) to track.mp3.
# Needs sox, ffmpeg, ffprobe and bc on PATH.

# Scratch directory for the intermediate layers. It is deliberately NOT called
# TMPDIR: that variable is read by mktemp and other tools, and leaving it
# pointing at a directory we delete breaks later commands in the same shell.
WORKDIR=$(mktemp -d) || exit 1
trap 'rm -rf -- "$WORKDIR"' EXIT   # also cleans up if a step below fails

# BEAT is 60/BPM rounded to 3 decimals; BAR is four beats (2.824 s).
BPM=85; BEAT=0.706; BAR=$(echo "$BEAT * 4" | bc); DUR=60
FADE=3   # length of the fade-in and fade-out, in seconds

# Pad — detuned chord (220 / 261.63 / 329.63 Hz, each doubled slightly sharp).
# -c 1 makes SoX mix the six oscillators into one channel; without it synth
# puts every oscillator on its own channel and writes a 6-channel file.
# chorus needs a modulation shape (-s sine / -t triangle) after each
# delay/decay/speed/depth group, otherwise SoX rejects the effect.
sox -n -r 44100 -c 1 "$WORKDIR/pad.wav" synth "$DUR" \
  sawtooth 220 sawtooth 220.8 sawtooth 261.63 sawtooth 262.4 sawtooth 329.63 sawtooth 330.4 \
  chorus 0.6 0.9 40 0.4 0.25 2 -t lowpass 700 reverb 50 gain -12

# Bass — root note
sox -n -r 44100 "$WORKDIR/bass.wav" synth "$DUR" sawtooth 110 lowpass 350 gain -8

# Kick — 0.3 s sine sweep from 160 Hz down to 45 Hz
sox -n -r 44100 "$WORKDIR/kick.wav" synth 0.3 sine 160:45 fade t 0.005 0.3 0.2 gain -3

# Texture — pink noise bed
ffmpeg -y -f lavfi -i "anoisesrc=color=pink:d=$DUR:s=44100" -af "lowpass=f=3000,highpass=f=200,volume=0.04" "$WORKDIR/texture.wav"

# Loop kick to fill duration.
# The 0.3 s hit is first padded/trimmed to exactly one beat so that four
# repeats really are one bar; repeating the bare hit would give a 1.2 s
# "bar" with kicks every 0.3 s and a loop that ends long before $DUR.
sox "$WORKDIR/kick.wav" "$WORKDIR/kick_beat.wav" pad 0 "$BEAT" trim 0 "$BEAT"
sox "$WORKDIR/kick_beat.wav" "$WORKDIR/kick_bar.wav" repeat 3
# bc truncates to an integer; -stream_loop N plays the file N+1 times, so the
# result always covers $DUR and -t trims the excess.
LOOPS=$(echo "$DUR / $BAR" | bc)
ffmpeg -y -stream_loop "$LOOPS" -i "$WORKDIR/kick_bar.wav" -t "$DUR" -c copy "$WORKDIR/kick_full.wav"

# Mix and export (fade-out start is derived from DUR instead of hard-coded)
ffmpeg -y -i "$WORKDIR/pad.wav" -i "$WORKDIR/bass.wav" -i "$WORKDIR/kick_full.wav" -i "$WORKDIR/texture.wav" \
  -filter_complex "[0][1][2][3]amix=inputs=4:normalize=0,loudnorm=I=-16:TP=-1.5:LRA=11,afade=t=in:d=$FADE,afade=t=out:st=$((DUR - FADE)):d=$FADE" \
  -ar 44100 -ac 2 -codec:a libmp3lame -b:a 192k track.mp3

rm -rf -- "$WORKDIR"
ffprobe -v error -show_entries format=duration,bit_rate -show_entries stream=sample_rate,channels,codec_name -of default=noprint_wrappers=1 track.mp3

Tool	Install	Use for
ffmpeg	Usually pre-installed	Mixing, filter graphs, MP3 encoding, `aevalsrc` expression synthesis
SoX	`brew install sox` / `apt install sox`	Waveform synthesis (native sawtooth/square/triangle/pluck), effects, sequencing
ffprobe	Bundled with ffmpeg	Verifying output (duration, bitrate, format)

# Workflow skeleton: every intermediate file lives in a private scratch directory.
# The variable is named WORKDIR rather than TMPDIR so the system temp-dir
# variable (read by mktemp and other tools) is left untouched.
WORKDIR=$(mktemp -d) || exit 1
trap 'rm -rf -- "$WORKDIR"' EXIT   # clean up on every exit path, including failures
# Generate layers into $WORKDIR/
# Mix layers
# Export final MP3
# Clean up: handled by the EXIT trap

beat_duration = 60 / BPM

BPM	Whole (s)	Half (s)	Quarter (s)	Eighth (s)	Sixteenth (s)
80	3.000	1.500	0.750	0.375	0.1875
90	2.667	1.333	0.667	0.333	0.167
100	2.400	1.200	0.600	0.300	0.150
110	2.182	1.091	0.545	0.273	0.136
120	2.000	1.000	0.500	0.250	0.125
130	1.846	0.923	0.462	0.231	0.115
140	1.714	0.857	0.429	0.214	0.107

Note	Oct 2	Oct 3	Oct 4	Oct 5	Oct 6
C	65.41	130.81	261.63	523.25	1046.50
C#	69.30	138.59	277.18	554.37	1108.73
D	73.42	146.83	293.66	587.33	1174.66
D#	77.78	155.56	311.13	622.25	1244.51
E	82.41	164.81	329.63	659.26	1318.51
F	87.31	174.61	349.23	698.46	1396.91
F#	92.50	185.00	369.99	739.99	1479.98
G	98.00	196.00	392.00	783.99	1567.98
G#	103.83	207.65	415.30	830.61	1661.22
A	110.00	220.00	440.00	880.00	1760.00
A#	116.54	233.08	466.16	932.33	1864.66
B	123.47	246.94	493.88	987.77	1975.53

Type	Intervals	Example (C4)
Major triad	root, M3, P5	261.63, 329.63, 392.00
Minor triad	root, m3, P5	261.63, 311.13, 392.00
Major 7th	root, M3, P5, M7	261.63, 329.63, 392.00, 493.88
Minor 7th	root, m3, P5, m7	261.63, 311.13, 392.00, 466.16
Dominant 7th	root, M3, P5, m7	261.63, 329.63, 392.00, 466.16

saw(f,t) = sin(f*2*PI*t) - sin(2*f*2*PI*t)/2 + sin(3*f*2*PI*t)/3 - sin(4*f*2*PI*t)/4 + sin(5*f*2*PI*t)/5

sq(f,t) = sin(f*2*PI*t) + sin(3*f*2*PI*t)/3 + sin(5*f*2*PI*t)/5 + sin(7*f*2*PI*t)/7

sin(2*PI*f*t - (f*0.004/5)*cos(5*2*PI*t))

(sin(f*2*PI*t) + sin((f+0.8)*2*PI*t)) / 2

# A2 sawtooth bass with 5 harmonics
# Harmonics 1-5 of 110 Hz (110..550 Hz), harmonic k weighted 1/k with
# alternating sign; the final /3 scales the sum down.
# Writes 2 s at 44.1 kHz to out.wav.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(110*2*PI*t)-sin(220*2*PI*t)/2+sin(330*2*PI*t)/3-sin(440*2*PI*t)/4+sin(550*2*PI*t)/5)/3 \
':s=44100:d=2" out.wav

# A4 square-ish lead with vibrato
# Fundamental plus odd harmonics 3, 5, 7 (weighted 1/3, 1/5, 1/7); /2 scales the sum.
# The vibrato is a phase term, not a factor on the frequency: writing
# sin(f*(1+d*sin(..))*2*PI*t) multiplies the wobble by t, so the pitch swing
# keeps growing as the note plays. With
#   phase = 2*PI*f*t - (f*depth/rate)*cos(2*PI*rate*t)
# the instantaneous frequency is f*(1 + depth*sin(2*PI*rate*t)).
# Here f=440, depth=0.004, rate=5 Hz, so f*depth/rate = 0.352.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(440*2*PI*t-0.352*cos(5*2*PI*t))+sin(1320*2*PI*t)/3+sin(2200*2*PI*t)/5+sin(3080*2*PI*t)/7)/2 \
':s=44100:d=2" out.wav

# Fast attack (0.01s), exponential decay
# min(t/0.01, 1) ramps linearly from 0 to 1 over the first 0.01 s and then
# stays at 1; exp(-3*t) fades the 440 Hz sine out over the 2 s clip.
ffmpeg -y -f lavfi -i "aevalsrc='sin(440*2*PI*t) * min(t/0.01, 1) * exp(-3*t)':s=44100:d=2" out.wav

# C major chord with detuned pairs — sounds full, not thin
# Each chord tone (261.63, 329.63, 392 Hz) is doubled by a sine about 0.8 Hz
# higher; /6 averages the six sines.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(261.63*2*PI*t)+sin(262.4*2*PI*t) + sin(329.63*2*PI*t)+sin(330.4*2*PI*t) + sin(392*2*PI*t)+sin(392.8*2*PI*t))/6 \
':s=44100:d=2" out.wav

# Play 4 notes in sequence, each 0.5s, looping every 2s
# C4 -> E4 -> G4 -> C5
# mod(t,2) is the position inside the 2 s loop; each between(...) is 1 only
# during its note's 0.5 s slot, so it gates that sine on and off.
# d=8 renders four passes of the loop.
ffmpeg -y -f lavfi -i "aevalsrc='\
  sin(261.63*2*PI*t)*between(mod(t,2),0,0.5) + \
  sin(329.63*2*PI*t)*between(mod(t,2),0.5,1.0) + \
  sin(392.00*2*PI*t)*between(mod(t,2),1.0,1.5) + \
  sin(523.25*2*PI*t)*between(mod(t,2),1.5,2.0) \
':s=44100:d=8" out.wav

# Each note gets its own attack/release envelope
# Every term is: sine * slot gate * attack ramp * release ramp.
#   attack  = min((position - slot_start)/0.01, 1)  -> 0..1 over the first 10 ms
#   release = min((slot_end - position)/0.01, 1)    -> 1..0 over the last 10 ms
# The first note measures its position with mod(t,0.5); the others use
# mod(t,2) minus the slot start.
ffmpeg -y -f lavfi -i "aevalsrc='\
  sin(261.63*2*PI*t) * between(mod(t,2),0,0.5) * min(mod(t,0.5)/0.01,1) * min((0.5-mod(t,0.5))/0.01,1) + \
  sin(329.63*2*PI*t) * between(mod(t,2),0.5,1.0) * min((mod(t,2)-0.5)/0.01,1) * min((1.0-mod(t,2))/0.01,1) + \
  sin(392.00*2*PI*t) * between(mod(t,2),1.0,1.5) * min((mod(t,2)-1.0)/0.01,1) * min((1.5-mod(t,2))/0.01,1) + \
  sin(523.25*2*PI*t) * between(mod(t,2),1.5,2.0) * min((mod(t,2)-1.5)/0.01,1) * min((2.0-mod(t,2))/0.01,1) \
':s=44100:d=8" out.wav

# White noise (hihats): 0.1 s of unfiltered white noise at 44.1 kHz
ffmpeg -y -f lavfi -i "anoisesrc=color=white:d=0.1:s=44100" hihat.wav

# Pink noise (snare body): 0.2 s of unfiltered pink noise at 44.1 kHz
ffmpeg -y -f lavfi -i "anoisesrc=color=pink:d=0.2:s=44100" snare_body.wav

# Layered kick, 0.4 s: two sine sweeps summed.
#   layer 1: frequency term 160*exp(-8*t)+45, amplitude 0.9*exp(-4*t)
#   layer 2: frequency term 80*exp(-15*t)+30, amplitude 0.4*exp(-3*t)
# The result is low-passed at 200 Hz and boosted by 1.5x.
ffmpeg -y -f lavfi -i "aevalsrc='\
  0.9*sin(2*PI*(160*exp(-8*t)+45)*t)*exp(-4*t) \
  + 0.4*sin(2*PI*(80*exp(-15*t)+30)*t)*exp(-3*t) \
':s=44100:d=0.4" -af "lowpass=f=200,volume=1.5" kick.wav

# Snare built from two layers that are generated separately and then mixed.
# Tone body (~200Hz, fast decay): 0.25 s sine at 200 Hz with exp(-15*t) amplitude
ffmpeg -y -f lavfi -i "aevalsrc='0.6*sin(200*2*PI*t)*exp(-15*t)':s=44100:d=0.25" snare_tone.wav
# Noise crack (pink noise, bandpassed, shaped): 0.2 s of pink noise, band-passed
# around 1200 Hz, 1 ms fade-in, fade-out from 0.05 s over 0.15 s
ffmpeg -y -f lavfi -i "anoisesrc=color=pink:d=0.2:s=44100" \
  -af "bandpass=f=1200:width_type=h:w=2000,afade=t=in:d=0.001,afade=t=out:st=0.05:d=0.15,volume=0.8" snare_noise.wav
# Layer them: normalize=0 keeps amix from rescaling the two inputs
ffmpeg -y -i snare_tone.wav -i snare_noise.wav -filter_complex "[0][1]amix=inputs=2:normalize=0" snare.wav

# Closed hi-hat: 0.08 s of white noise, high-passed at 7 kHz and band-passed
# around 10 kHz, fading out from 0.015 s to the end of the clip.
ffmpeg -y -f lavfi -i "anoisesrc=color=white:d=0.08:s=44100" \
  -af "highpass=f=7000,bandpass=f=10000:width_type=h:w=4000,afade=t=out:st=0.015:d=0.065,volume=0.35" hihat.wav

# Open hi-hat: same idea but 0.2 s long, with lower filter frequencies
# (6 kHz / 9 kHz) and a fade-out from 0.05 s to the end of the clip.
ffmpeg -y -f lavfi -i "anoisesrc=color=white:d=0.2:s=44100" \
  -af "highpass=f=6000,bandpass=f=9000:width_type=h:w=5000,afade=t=out:st=0.05:d=0.15,volume=0.25" openhat.wav

# Sawtooth A4 for 2 seconds — one command vs 5-line aevalsrc expression
sox -n -r 44100 out.wav synth 2 sawtooth 440

# C major chord — three sawtooth oscillators summed
# -c 1 on the output is what sums them: with a null input and no channel
# count, synth gives each oscillator its own channel, so without -c 1 this
# would write a 3-channel file instead of a chord.
sox -n -r 44100 -c 1 out.wav synth 2 sawtooth 261.63 sawtooth 329.63 sawtooth 392

# 4-note melody: C4 → E4 → G4 → C5, each 0.5s
# Each ':' starts a new effects chain holding the next 0.5 s synth.
sox -n -r 44100 out.wav synth 0.5 sawtooth 261.63 : synth 0.5 sawtooth 329.63 : synth 0.5 sawtooth 392 : synth 0.5 sawtooth 523.25

# Sine sweep 160→45Hz with fade — replaces the complex aevalsrc kick recipe
# 0.3 s long; "160:45" is the start:end frequency pair for the sweep.
sox -n -r 44100 kick.wav synth 0.3 sine 160:45 fade t 0.005 0.3 0.2 gain -3

# Karplus-Strong pluck — great for lo-fi guitar sounds, not possible with ffmpeg
# 1.5 s pluck at 220 Hz followed by a fade effect.
sox -n -r 44100 pluck.wav synth 1.5 pluck 220 fade t 0.005 1.5 0.5

# Effects chain left-to-right after filename
# chorus takes gain-in gain-out, then one "delay decay speed depth -s|-t"
# group per voice. The trailing modulation shape (-s sine, -t triangle) is
# mandatory; without it SoX rejects the effect with a usage error.
sox in.wav out.wav reverb 50 chorus 0.6 0.9 40 0.4 0.25 2 -t lowpass 800 gain -2

Effect	Usage	Example
`reverb`	Room ambience (30–80 useful range)	`reverb 50`
`chorus`	Stereo widening	`chorus 0.6 0.9 40 0.4 0.25 2 -t`
`overdrive`	Harmonic saturation (5–10 subtle, 20+ aggressive)	`overdrive 10`
`lowpass`	Warmth	`lowpass 800`
`highpass`	Clarity for non-bass	`highpass 200`
`tremolo`	Amplitude modulation	`tremolo 5 60`
`fade`	Fade in/out	`fade t 2 60 3`
`gain`	Volume in dB	`gain -3`

# Mix files (sum): -m combines the inputs by mixing; the last name is the output
sox -m melody.wav bass.wav mix.wav

# Concatenate files: without -m, several inputs are joined end to end
sox bar.wav bar.wav bar.wav long.wav

# Repeat a bar 30 times (29 additional plays)
# "repeat N" appends N extra copies after the original pass.
sox in.wav out.wav repeat 29

# Trim to exact duration: keep 2.824 s starting at position 0
sox in.wav out.wav trim 0 2.824

Task	SoX	ffmpeg
Sawtooth/square/triangle tone	`synth 2 sawtooth 440`	5-line `aevalsrc` harmonic series
Kick drum (freq sweep)	`synth 0.3 sine 160:45`	`aevalsrc` with `exp()` sweep
Plucked string sound	`synth 1.5 pluck 220`	Not practical
Reverb	`reverb 50` — simple, good	`aecho` — workable but not true reverb
Complex time-sequenced patterns	Clunky `:` concat syntax	`between(mod(t,...))` — flexible
Place hits at exact ms positions	Not supported	`adelay` + `amix`
Mix 5+ layers with per-layer volume	Possible but awkward	`amix=normalize=0` + `volume` per input
Final MP3 encode + loudnorm	No MP3 encoding	`libmp3lame` + `loudnorm`

# One 2-second drum bar at 120 BPM, built from three one-shot sources.
# BPM and BEAT_MS are not referenced by the command below; they record how the
# hard-coded millisecond delays were derived.
BPM=120
BEAT_MS=500  # 60000/120

# Kick on beats 1 and 3 (0ms and 1000ms)
# Snare on beats 2 and 4 (500ms and 1500ms)
# Hihat on every eighth note (0, 250, 500, 750, 1000, 1250, 1500, 1750)

# Inputs: [0] kick (decaying sine sweep), [1] pink noise (snare), [2] white noise (hihat).
# asplit makes one copy of a source per hit, adelay moves each copy to its
# position in the bar (in ms), and the snare/hihat copies are filtered after
# the delay. amix sums all 12 hits without rescaling (normalize=0); apad and
# -t then fix the bar length at 2 s.
ffmpeg -y \
  -f lavfi -i "aevalsrc='sin(2*PI*(150*exp(-10*t))*t)*exp(-5*t)':s=44100:d=0.3" \
  -f lavfi -i "anoisesrc=color=pink:d=0.15:s=44100" \
  -f lavfi -i "anoisesrc=color=white:d=0.05:s=44100" \
  -filter_complex "\
    [0]asplit=2[k1][k2]; \
    [1]asplit=2[s1][s2]; \
    [2]asplit=8[h1][h2][h3][h4][h5][h6][h7][h8]; \
    [k1]adelay=0|0[dk1]; [k2]adelay=1000|1000[dk2]; \
    [s1]adelay=500|500,highpass=f=200,bandpass=f=300:width_type=h:w=200[ds1]; \
    [s2]adelay=1500|1500,highpass=f=200,bandpass=f=300:width_type=h:w=200[ds2]; \
    [h1]adelay=0|0,highpass=f=8000[dh1]; \
    [h2]adelay=250|250,highpass=f=8000[dh2]; \
    [h3]adelay=500|500,highpass=f=8000[dh3]; \
    [h4]adelay=750|750,highpass=f=8000[dh4]; \
    [h5]adelay=1000|1000,highpass=f=8000[dh5]; \
    [h6]adelay=1250|1250,highpass=f=8000[dh6]; \
    [h7]adelay=1500|1500,highpass=f=8000[dh7]; \
    [h8]adelay=1750|1750,highpass=f=8000[dh8]; \
    [dk1][dk2][ds1][ds2][dh1][dh2][dh3][dh4][dh5][dh6][dh7][dh8]amix=inputs=12:normalize=0,volume=0.8,apad=whole_dur=2 \
  " -t 2 drum_bar.wav

# Loop a 2-second bar to fill 60 seconds
# -stream_loop 29 replays the input 29 extra times (30 plays x 2 s = 60 s);
# -t 60 caps the output length and -c copy avoids re-encoding.
ffmpeg -y -stream_loop 29 -i drum_bar.wav -t 60 -c copy drums_full.wav

# Square-ish melody with vibrato, 4 notes at 120 BPM
# Pattern: C5, D5, E5, C5 — each note has attack/release envelope
# Each note is fundamental + 3rd + 5th harmonic, scaled by 0.3, gated to its
# 0.5 s slot with a 15 ms attack ramp and a 40 ms release ramp.
# Vibrato (5 Hz, depth 0.004) is added as a phase term,
#   sin(2*PI*f*t - f*(0.004/5)*cos(2*PI*5*t)),
# which gives an instantaneous frequency of f*(1 + 0.004*sin(2*PI*5*t)).
# Scaling the frequency inside sin(f*(1+...)*2*PI*t) instead would multiply
# the wobble by t, so the pitch swing would keep growing through the bar.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(523.25*2*PI*t-523.25*0.0008*cos(5*2*PI*t))+sin(1569.75*2*PI*t)/3+sin(2616.25*2*PI*t)/5)*0.3 \
  * between(mod(t,2),0,0.5) * min(mod(t,2)/0.015,1) * min((0.5-mod(t,2))/0.04,1) + \
  (sin(587.33*2*PI*t-587.33*0.0008*cos(5*2*PI*t))+sin(1761.99*2*PI*t)/3+sin(2936.65*2*PI*t)/5)*0.3 \
  * between(mod(t,2),0.5,1.0) * min((mod(t,2)-0.5)/0.015,1) * min((1.0-mod(t,2))/0.04,1) + \
  (sin(659.26*2*PI*t-659.26*0.0008*cos(5*2*PI*t))+sin(1977.78*2*PI*t)/3+sin(3296.3*2*PI*t)/5)*0.3 \
  * between(mod(t,2),1.0,1.5) * min((mod(t,2)-1.0)/0.015,1) * min((1.5-mod(t,2))/0.04,1) + \
  (sin(523.25*2*PI*t-523.25*0.0008*cos(5*2*PI*t))+sin(1569.75*2*PI*t)/3+sin(2616.25*2*PI*t)/5)*0.3 \
  * between(mod(t,2),1.5,2.0) * min((mod(t,2)-1.5)/0.015,1) * min((2.0-mod(t,2))/0.04,1) \
':s=44100:d=2" -af "lowpass=f=2500,tremolo=f=3:d=0.3,volume=0.55" melody_bar.wav

# Sawtooth bass following chord roots at 120 BPM, with plucky envelope
# Notes: C3, C3, D3, C3 (130.81 / 146.83 Hz), one per 0.5 s beat.
# Every note is a 5-harmonic sawtooth approximation (harmonic k weighted 1/k,
# alternating sign, sum scaled by 1/3). The D3 note now carries its 5th
# harmonic (734.15 Hz) like the C3 notes, so all four notes share one timbre.
# Envelope per note: sounds for 0.45 s of its slot, 8 ms attack ramp, then
# exp(-1.2*x) decay measured from the start of the slot.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(130.81*2*PI*t)-sin(261.62*2*PI*t)/2+sin(392.43*2*PI*t)/3-sin(523.24*2*PI*t)/4+sin(654.05*2*PI*t)/5)/3 \
  * between(mod(t,2),0,0.45) * min(mod(t,0.5)/0.008,1) * exp(-1.2*mod(t,0.5)) + \
  (sin(130.81*2*PI*t)-sin(261.62*2*PI*t)/2+sin(392.43*2*PI*t)/3-sin(523.24*2*PI*t)/4+sin(654.05*2*PI*t)/5)/3 \
  * between(mod(t,2),0.5,0.95) * min((mod(t,2)-0.5)/0.008,1) * exp(-1.2*(mod(t,2)-0.5)) + \
  (sin(146.83*2*PI*t)-sin(293.66*2*PI*t)/2+sin(440.49*2*PI*t)/3-sin(587.32*2*PI*t)/4+sin(734.15*2*PI*t)/5)/3 \
  * between(mod(t,2),1.0,1.45) * min((mod(t,2)-1.0)/0.008,1) * exp(-1.2*(mod(t,2)-1.0)) + \
  (sin(130.81*2*PI*t)-sin(261.62*2*PI*t)/2+sin(392.43*2*PI*t)/3-sin(523.24*2*PI*t)/4+sin(654.05*2*PI*t)/5)/3 \
  * between(mod(t,2),1.5,1.95) * min((mod(t,2)-1.5)/0.008,1) * exp(-1.2*(mod(t,2)-1.5)) \
':s=44100:d=2" -af "lowpass=f=350,volume=0.7" bass_bar.wav

# Warm pad: detuned pairs + chorus + echo + lowpass
# Source: C major triad (261.63 / 329.63 / 392 Hz), each tone doubled about
# 0.8 Hz sharp and averaged (/6), with a slow 0.15 Hz amplitude swell between
# 0.2 and 1.0. Rendered for 8 s.
# Filters, in order: 800 Hz low-pass, three-voice chorus, single-tap echo
# (90 ms delay, 0.25 decay), then volume 0.3.
ffmpeg -y -f lavfi -i "aevalsrc='\
  (sin(261.63*2*PI*t)+sin(262.4*2*PI*t) + sin(329.63*2*PI*t)+sin(330.4*2*PI*t) + sin(392*2*PI*t)+sin(392.8*2*PI*t)) / 6 \
  * (0.6 + 0.4*sin(0.15*2*PI*t)) \
':s=44100:d=8" \
  -af "lowpass=f=800,chorus=0.6:0.9:40|55|70:0.4|0.35|0.3:0.25|0.3|0.35:2|1.5|2.5,aecho=0.8:0.7:90:0.25,volume=0.3" pad.wav

# Lo-fi room noise: pink noise, bandpassed, very quiet
# 60 s of pink noise limited to 200-3000 Hz (high-pass + low-pass) and
# attenuated to 4 % amplitude so it sits under the other layers.
ffmpeg -y -f lavfi -i "anoisesrc=color=pink:d=60:s=44100" \
  -af "lowpass=f=3000,highpass=f=200,volume=0.04" vinyl_texture.wav

Filter	Usage	Example
`volume`	Per-layer level balance	`volume=0.6`
`lowpass`	Cut highs (warmth, taming harmonics)	`lowpass=f=800`
`highpass`	Cut lows (clarity for non-bass)	`highpass=f=200`
`afade`	Fade in/out (prevent abrupt start/end)	`afade=t=in:d=2`, `afade=t=out:st=58:d=2`
`amix`	Mix multiple streams	`amix=inputs=4:normalize=0`
`apad`	Pad with silence (fix amix truncation)	`apad=whole_dur=2.824`
`loudnorm`	EBU R128 loudness normalization	`loudnorm=I=-16:TP=-1.5:LRA=11`

Filter	Usage	Example
`chorus`	Stereo width / thickening (essential for pads)	`chorus=0.6:0.9:40\|55\|70:0.4\|0.35\|0.3:0.25\|0.3\|0.35:2\|1.5\|2.5`
`aecho`	Space / depth (pads, ambient)	`aecho=0.8:0.7:90\|250:0.25\|0.15`
`tremolo`	Amplitude movement (melody, pads)	`tremolo=f=3:d=0.3`
`bandpass`	Isolate frequency band (drums, snare)	`bandpass=f=1000:width_type=h:w=500`
`adelay`	Place drum hits in time (ms, per-channel)	`adelay=500\|500`

Filter	Usage	Example
`flanger`	Sweeping modulation (leads, synths)	`flanger=delay=3:depth=2:speed=0.5`
`vibrato`	Pitch modulation (as filter, not in-expr)	`vibrato=f=5:d=0.4`
`areverse`	Reverse audio (FX, risers)	`areverse`
`atempo`	Change speed	`atempo=0.5` (half speed)

# Step 1 — mix: sum the five full-length layers without amix rescaling
# (normalize=0), then loudness-normalize the sum to -16 LUFS integrated,
# -1.5 dBTP true peak, LRA 11. Output is 44.1 kHz stereo WAV.
ffmpeg -y \
  -i melody_full.wav \
  -i bass_full.wav \
  -i drums_full.wav \
  -i pad_full.wav \
  -i vinyl_texture.wav \
  -filter_complex "\
    [0][1][2][3][4]amix=inputs=5:normalize=0,\
    loudnorm=I=-16:TP=-1.5:LRA=11\
  " \
  -ar 44100 -ac 2 mix.wav

# Step 2 — export: encode the mix as 192 kbit/s MP3 with libmp3lame
ffmpeg -y -i mix.wav -codec:a libmp3lame -b:a 192k -ar 44100 -ac 2 output.mp3

# Step 3 — verify: print container duration/bitrate/format and the audio
# stream's sample rate, channel count and codec as key=value lines
ffprobe -v error -show_entries format=duration,bit_rate,format_name -show_entries stream=sample_rate,channels,codec_name -of default=noprint_wrappers=1 output.mp3

# Build the concat playlist: one "file '<name>'" line per section, in play order
printf "file '%s'\n" intro.wav verse.wav chorus.wav outro.wav > list.txt

# Join the listed sections into one file without re-encoding
ffmpeg -y -f concat -safe 0 -i list.txt -c copy full_track.wav

# 60 s track: 3 s fade-in from the start, 3 s fade-out beginning at 57 s
ffmpeg -y -i full_track.wav \
  -af "afade=t=in:d=3,afade=t=out:st=57:d=3" \
  full_track_faded.wav

Genre	Integrated (I)	True Peak (TP)	LRA
Ambient	-18	-2.0	11
Lo-fi / Chill	-16	-1.5	11
Electronic	-14	-1.5	9
Techno / EDM	-14	-1.5	9

cli-music

cli-music

Quick Recipe

Overview & Constraints

Rhythm & Timing Math

Note Frequency Reference

Chromatic Scale (Hz) — Octaves 2–6

Common Scales (Hz values at octave 4)

Chord Formulas

Common Progressions with Hz

Composition Principles

Core Synthesis Techniques

Waveform Recipes (use these, not bare sine)

aevalsrc — Expression-based synthesis (primary tool)

anoisesrc — Noise-based percussion

Drum sample recipes (always layer, never single-source)

SoX Synthesis

Waveform types

Single tone

Chord (multiple oscillators)

Note sequence

Kick drum (frequency sweep)

Plucked string

Effects

Mixing & looping with SoX

When to use SoX vs ffmpeg

Building Patterns

Drum hits with adelay + amix

Looping bars to fill duration with -stream_loop

Melodic sequences with aevalsrc

Layer Recipes

Melody Layer

Bass Layer

Drum Layer

Pad Layer

Vinyl / Noise Texture Layer

Effects Reference

Mixing & Exporting

Mix all layers

Export to MP3

Verify with ffprobe

Structure & Arrangement

Concatenating sections

Fade in / fade out

Genre Templates

Lo-fi Hip-Hop

Ambient

Electronic / Techno

Synthwave / Retro

Complete Workflow Checklist

Troubleshooting

Songsee

Video Frames

Gifgrep

Qqbot Media

Camsnap

Openai Whisper Api

`aevalsrc` — Expression-based synthesis (primary tool)

`anoisesrc` — Noise-based percussion

Drum hits with `adelay` + `amix`

Looping bars to fill duration with `-stream_loop`

Melodic sequences with `aevalsrc`