TeaWeb/shared/js/voice/RecorderBase.ts

326 lines
10 KiB
TypeScript

import {InputDevice} from "../audio/Recorder";
import {Registry} from "../events";
import {Filter, FilterType, FilterTypeClass} from "../voice/Filter";
/**
 * Discriminator for the different kinds of input consumers.
 * Each member is used as the `type` tag of the matching `*InputConsumer` interface.
 */
export enum InputConsumerType {
    /** Tag of `CallbackInputConsumer`. */
    CALLBACK = 0,
    /** Tag of `NodeInputConsumer`. */
    NODE = 1,
    /** Tag of `NativeInputConsumer`. */
    NATIVE = 2
}
/**
 * Consumer which receives the input via callbacks.
 * Both callbacks are optional.
 */
export interface CallbackInputConsumer {
    type: InputConsumerType.CALLBACK;

    /** Optional callback receiving an `AudioBuffer`. */
    callbackAudio?: (buffer: AudioBuffer) => any;

    /** Optional callback receiving a raw `Float32Array` along with a sample and a channel count. */
    callbackBuffer?: (buffer: Float32Array, samples: number, channels: number) => any;
}
/**
 * Consumer which works on an `AudioNode`.
 * Both callbacks are required and receive the source node.
 */
export interface NodeInputConsumer {
    type: InputConsumerType.NODE;

    /** Called with the source node. */
    callbackNode: (source_node: AudioNode) => any;

    /** Called with the source node on disconnect. */
    callbackDisconnect: (source_node: AudioNode) => any;
}
/**
 * Consumer tagged as `InputConsumerType.NATIVE`.
 * It carries no further properties besides its type tag.
 */
export interface NativeInputConsumer {
    type: InputConsumerType.NATIVE;
}
/**
 * Union of all known input consumers, discriminated by their `type` property.
 */
export type InputConsumer =
    | CallbackInputConsumer
    | NodeInputConsumer
    | NativeInputConsumer;
/**
 * The states an input can be in.
 */
export enum InputState {
    /** Input recording has been paused. */
    PAUSED = 0,

    /** Recording has been requested, and is currently initializing. */
    INITIALIZING = 1,

    /** The input is currently being recorded. */
    RECORDING = 2
}
/**
 * Error codes which `AbstractInput.start()` may resolve with instead of `true`.
 * Every member maps to the lower case string of its own name.
 */
export enum InputStartError {
    EUNKNOWN = "eunknown",

    /** Returned on start when the target device is unknown (see `AbstractInput.setDeviceId`). */
    EDEVICEUNKNOWN = "edeviceunknown",

    EBUSY = "ebusy",

    ENOTALLOWED = "enotallowed",

    ESYSTEMDENIED = "esystemdenied",

    ENOTSUPPORTED = "enotsupported",

    ESYSTEMUNINITIALIZED = "esystemuninitialized"
}
/**
 * Event map of an input.
 * Each key is an event name and each value is the payload shape of that event.
 */
export interface InputEvents {
    /** Carries the previous and the new input state. */
    notify_state_changed: { oldState: InputState; newState: InputState };

    /** Carries no payload. */
    notify_voice_start: {};

    /** Carries no payload. */
    notify_voice_end: {};

    /** Carries the previous and the new filter mode. */
    notify_filter_mode_changed: {
        oldMode: FilterMode;
        newMode: FilterMode;
    };

    /** Carries the previous and the new device id. */
    notify_device_changed: {
        oldDeviceId: string;
        newDeviceId: string;
    };
}
/**
 * Describes how the registered filters are applied to the input.
 */
export enum FilterMode {
    /** Apply all filters and act according to the output. */
    Filter = 0,

    /** Bypass all filters and replay the audio. */
    Bypass = 1,

    /** Block all communication. */
    Block = 2
}
/**
 * All available options for input processing.
 * Input processing is only available on the native client, so these are the options
 * which the native client (especially its WebRTC audio processing) offers.
 *
 * The keys are flat, dot separated paths and are grouped below by their prefix.
 */
export interface InputProcessorConfigWebRTC {
    /* pipeline */
    "pipeline.maximum_internal_processing_rate": number;
    "pipeline.multi_channel_render": boolean;
    "pipeline.multi_channel_capture": boolean;

    /* pre_amplifier */
    "pre_amplifier.enabled": boolean;
    "pre_amplifier.fixed_gain_factor": number;

    /* high_pass_filter */
    "high_pass_filter.enabled": boolean;
    "high_pass_filter.apply_in_full_band": boolean;

    /* echo_canceller */
    "echo_canceller.enabled": boolean;
    "echo_canceller.mobile_mode": boolean;
    "echo_canceller.export_linear_aec_output": boolean;
    "echo_canceller.enforce_high_pass_filtering": boolean;

    /* noise_suppression */
    "noise_suppression.enabled": boolean;
    "noise_suppression.level": "low" | "moderate" | "high" | "very-high";
    "noise_suppression.analyze_linear_aec_output_when_available": boolean;

    /* transient_suppression */
    "transient_suppression.enabled": boolean;

    /* voice_detection */
    "voice_detection.enabled": boolean;

    /* gain_controller1 */
    "gain_controller1.enabled": boolean;
    "gain_controller1.mode": "adaptive-analog" | "adaptive-digital" | "fixed-digital";
    "gain_controller1.target_level_dbfs": number;
    "gain_controller1.compression_gain_db": number;
    "gain_controller1.enable_limiter": boolean;
    "gain_controller1.analog_level_minimum": number;
    "gain_controller1.analog_level_maximum": number;

    /* gain_controller1.analog_gain_controller */
    "gain_controller1.analog_gain_controller.enabled": boolean;
    "gain_controller1.analog_gain_controller.startup_min_volume": number;
    "gain_controller1.analog_gain_controller.clipped_level_min": number;
    "gain_controller1.analog_gain_controller.enable_agc2_level_estimator": boolean;
    "gain_controller1.analog_gain_controller.enable_digital_adaptive": boolean;

    /* gain_controller2 */
    "gain_controller2.enabled": boolean;
    "gain_controller2.fixed_digital.gain_db": number;

    /* gain_controller2.adaptive_digital */
    "gain_controller2.adaptive_digital.enabled": boolean;
    "gain_controller2.adaptive_digital.vad_probability_attack": number;
    "gain_controller2.adaptive_digital.level_estimator": "rms" | "peak";
    "gain_controller2.adaptive_digital.level_estimator_adjacent_speech_frames_threshold": number;
    "gain_controller2.adaptive_digital.use_saturation_protector": boolean;
    "gain_controller2.adaptive_digital.initial_saturation_margin_db": number;
    "gain_controller2.adaptive_digital.extra_saturation_margin_db": number;
    "gain_controller2.adaptive_digital.gain_applier_adjacent_speech_frames_threshold": number;
    "gain_controller2.adaptive_digital.max_gain_change_db_per_second": number;
    "gain_controller2.adaptive_digital.max_output_noise_level_dbfs": number;

    /* residual_echo_detector */
    "residual_echo_detector.enabled": boolean;

    /* level_estimation */
    "level_estimation.enabled": boolean;
}
/**
 * Presence table containing every key of `InputProcessorConfigWebRTC`.
 *
 * The `Record<keyof ..., true>` annotation lets the compiler enforce that this table
 * stays in sync with the interface: a missing key as well as an unknown key
 * results in a compile error.
 */
const kInputProcessorConfigWebRTCKeyTable: Record<keyof InputProcessorConfigWebRTC, true> = {
    "pipeline.maximum_internal_processing_rate": true,
    "pipeline.multi_channel_render": true,
    "pipeline.multi_channel_capture": true,
    "pre_amplifier.enabled": true,
    "pre_amplifier.fixed_gain_factor": true,
    "high_pass_filter.enabled": true,
    "high_pass_filter.apply_in_full_band": true,
    "echo_canceller.enabled": true,
    "echo_canceller.mobile_mode": true,
    "echo_canceller.export_linear_aec_output": true,
    "echo_canceller.enforce_high_pass_filtering": true,
    "noise_suppression.enabled": true,
    "noise_suppression.level": true,
    "noise_suppression.analyze_linear_aec_output_when_available": true,
    "transient_suppression.enabled": true,
    "voice_detection.enabled": true,
    "gain_controller1.enabled": true,
    "gain_controller1.mode": true,
    "gain_controller1.target_level_dbfs": true,
    "gain_controller1.compression_gain_db": true,
    "gain_controller1.enable_limiter": true,
    "gain_controller1.analog_level_minimum": true,
    "gain_controller1.analog_level_maximum": true,
    "gain_controller1.analog_gain_controller.enabled": true,
    "gain_controller1.analog_gain_controller.startup_min_volume": true,
    "gain_controller1.analog_gain_controller.clipped_level_min": true,
    "gain_controller1.analog_gain_controller.enable_agc2_level_estimator": true,
    "gain_controller1.analog_gain_controller.enable_digital_adaptive": true,
    "gain_controller2.enabled": true,
    "gain_controller2.fixed_digital.gain_db": true,
    "gain_controller2.adaptive_digital.enabled": true,
    "gain_controller2.adaptive_digital.vad_probability_attack": true,
    "gain_controller2.adaptive_digital.level_estimator": true,
    "gain_controller2.adaptive_digital.level_estimator_adjacent_speech_frames_threshold": true,
    "gain_controller2.adaptive_digital.use_saturation_protector": true,
    "gain_controller2.adaptive_digital.initial_saturation_margin_db": true,
    "gain_controller2.adaptive_digital.extra_saturation_margin_db": true,
    "gain_controller2.adaptive_digital.gain_applier_adjacent_speech_frames_threshold": true,
    "gain_controller2.adaptive_digital.max_gain_change_db_per_second": true,
    "gain_controller2.adaptive_digital.max_output_noise_level_dbfs": true,
    "residual_echo_detector.enabled": true,
    "level_estimation.enabled": true
};

/**
 * List of all keys of `InputProcessorConfigWebRTC`.
 *
 * Attention:
 * These keys **MUST** be equal to all keys of `InputProcessorConfigWebRTC`.
 * All keys not registered in here will not be considered.
 *
 * The list is derived from the compile-time checked key table above.
 * All keys are non-numeric strings, so `Object.keys` yields them in the
 * order in which they have been written down.
 */
export const kInputProcessorConfigWebRTCKeys: (keyof InputProcessorConfigWebRTC)[] =
    Object.keys(kInputProcessorConfigWebRTCKeyTable) as (keyof InputProcessorConfigWebRTC)[];
/**
 * All available options of the RNNoise input processor.
 */
export interface InputProcessorConfigRNNoise {
    "rnnoise.enabled": boolean;
}
/**
 * Presence table containing every key of `InputProcessorConfigRNNoise`.
 *
 * The `Record<keyof ..., true>` annotation lets the compiler enforce that this table
 * stays in sync with the interface: a missing key as well as an unknown key
 * results in a compile error.
 */
const kInputProcessorConfigRNNoiseKeyTable: Record<keyof InputProcessorConfigRNNoise, true> = {
    "rnnoise.enabled": true
};

/**
 * List of all keys of `InputProcessorConfigRNNoise`.
 *
 * Attention:
 * These keys **MUST** be equal to all keys of `InputProcessorConfigRNNoise`.
 * All keys not registered in here will not be considered.
 *
 * The list is derived from the compile-time checked key table above.
 */
export const kInputProcessorConfigRNNoiseKeys: (keyof InputProcessorConfigRNNoise)[] =
    Object.keys(kInputProcessorConfigRNNoiseKeyTable) as (keyof InputProcessorConfigRNNoise)[];
/**
 * Maps every input processor type name to the shape of its config.
 */
export interface InputProcessorConfigMapping {
    "webrtc-processing": InputProcessorConfigWebRTC;
    "rnnoise": InputProcessorConfigRNNoise;
}
/**
 * Name of an input processor.
 * This is the union of all keys of `InputProcessorConfigMapping`.
 */
export type InputProcessorType = keyof InputProcessorConfigMapping;
/**
 * Statistics reported by the input processors.
 * Every value may be `undefined`.
 */
export interface InputProcessorStatistics {
    /*
     * WebRTC processor statistics
     */
    output_rms_dbfs: number | undefined;
    voice_detected: number | undefined;
    echo_return_loss: number | undefined;
    echo_return_loss_enhancement: number | undefined;
    divergent_filter_fraction: number | undefined;
    delay_median_ms: number | undefined;
    delay_standard_deviation_ms: number | undefined;
    residual_echo_likelihood: number | undefined;
    residual_echo_likelihood_recent_max: number | undefined;
    delay_ms: number | undefined;

    /*
     * RNNoise processor statistics
     */
    rnnoise_volume: number | undefined;
}
/**
 * Access to the input processors of an input and to their configuration.
 */
export interface InputProcessor {
    /**
     * @param processor Target processor type
     * @returns `true` if the target processor type is supported and available
     */
    hasProcessor(processor: InputProcessorType): boolean;

    /**
     * Get the processor config of the target type.
     * This method will throw when the target processor isn't supported.
     * @param processor Target processor type.
     * @returns The processor config.
     */
    getProcessorConfig<T extends InputProcessorType>(processor: T): InputProcessorConfigMapping[T];

    /**
     * Apply the target config.
     * @param processor Target processor type.
     * @param config The config which should be applied. Its shape is bound to the processor type.
     */
    applyProcessorConfig<T extends InputProcessorType>(processor: T, config: InputProcessorConfigMapping[T]): void;

    /**
     * Get the current processor statistics.
     */
    getStatistics(): InputProcessorStatistics;
}
/**
 * Contract every audio input has to fulfil.
 */
export interface AbstractInput {
    /** Event registry for all events listed in `InputEvents`. */
    readonly events: Registry<InputEvents>;

    /** Get the current state of the input. */
    currentState(): InputState;

    /** Destroy the input. */
    destroy(): void;

    /**
     * Start the input.
     * @returns A promise resolving with `true` or with an `InputStartError`.
     */
    start(): Promise<InputStartError | true>;

    /** Stop the input. */
    stop(): Promise<void>;

    /**
     * Returns true if the input is currently filtered.
     * If the current state isn't recording, then it will return true.
     */
    isFiltered(): boolean;

    getFilterMode(): FilterMode;
    setFilterMode(mode: FilterMode): void;

    /** Get the id of the current device or `undefined`. */
    currentDeviceId(): string | undefined;

    /**
     * This method should not throw!
     * If the target device is unknown, it should return `InputStartError.EDEVICEUNKNOWN` on start.
     * If the device is different than the current device the recorder stops.
     *
     * When the device has been changed the event `notify_device_changed` will be fired.
     */
    setDeviceId(device: string): Promise<void>;

    /** Get the current consumer or `undefined`. */
    currentConsumer(): InputConsumer | undefined;
    setConsumer(consumer: InputConsumer): Promise<void>;

    /** Test whether the given filter type is supported. */
    supportsFilter(type: FilterType): boolean;

    /**
     * Create a new filter of the given type.
     * @param type The filter type.
     * @param priority The filter priority.
     * @returns The filter instance matching the given type.
     */
    createFilter<T extends FilterType>(type: T, priority: number): FilterTypeClass<T>;

    /** Remove the given filter. */
    removeFilter(filter: Filter): void;

    getVolume(): number;
    setVolume(volume: number): void;

    /** Get the input processor of this input. */
    getInputProcessor(): InputProcessor;

    /**
     * Create a new level meter for this audio input.
     * This level meter will indicate the audio level after all processing.
     * Note: Changing the input device or stopping the input will result in no activity.
     */
    createLevelMeter(): LevelMeter;
}
/**
 * Level meter contract, for example returned by `AbstractInput.createLevelMeter()`.
 */
export interface LevelMeter {
    /** Get the input device of this level meter. */
    getDevice(): InputDevice;

    /**
     * Set the observer callback.
     * @param callback Invoked with a number (presumably the current level; value range not visible here).
     */
    setObserver(callback: (value: number) => any): void;

    /** Destroy the level meter. */
    destroy(): void;
}