@siteed/expo-audio-studio
Version:
Comprehensive audio processing library for React Native and Expo with recording, analysis, visualization, and streaming capabilities across iOS, Android, and web
562 lines (522 loc) • 21.7 kB
text/typescript
/*
* There is a bug where `navigator.mediaDevices.getUserMedia` + `MediaRecorder`
* creates WEBM files without duration metadata. See:
* - https://bugs.chromium.org/p/chromium/issues/detail?id=642012
* - https://stackoverflow.com/a/39971175/13989043
*
* This file contains a function that fixes the duration metadata of a WEBM file.
* - Answer found: https://stackoverflow.com/a/75218309/13989043
* - Code adapted from: https://github.com/mat-sz/webm-fix-duration
* (forked from https://github.com/yusitnikov/fix-webm-duration)
*/
/*
* This is the list of possible WEBM file sections by their IDs.
* Possible types: Container, Binary, Uint, Int, String, Float, Date
*/
interface Section {
name: string
type: string
}
const sections: Record<number, Section> = {
0xa45dfa3: { name: 'EBML', type: 'Container' },
0x286: { name: 'EBMLVersion', type: 'Uint' },
0x2f7: { name: 'EBMLReadVersion', type: 'Uint' },
0x2f2: { name: 'EBMLMaxIDLength', type: 'Uint' },
0x2f3: { name: 'EBMLMaxSizeLength', type: 'Uint' },
0x282: { name: 'DocType', type: 'String' },
0x287: { name: 'DocTypeVersion', type: 'Uint' },
0x285: { name: 'DocTypeReadVersion', type: 'Uint' },
0x6c: { name: 'Void', type: 'Binary' },
0x3f: { name: 'CRC-32', type: 'Binary' },
0xb538667: { name: 'SignatureSlot', type: 'Container' },
0x3e8a: { name: 'SignatureAlgo', type: 'Uint' },
0x3e9a: { name: 'SignatureHash', type: 'Uint' },
0x3ea5: { name: 'SignaturePublicKey', type: 'Binary' },
0x3eb5: { name: 'Signature', type: 'Binary' },
0x3e5b: { name: 'SignatureElements', type: 'Container' },
0x3e7b: { name: 'SignatureElementList', type: 'Container' },
0x2532: { name: 'SignedElement', type: 'Binary' },
0x8538067: { name: 'Segment', type: 'Container' },
0x14d9b74: { name: 'SeekHead', type: 'Container' },
0xdbb: { name: 'Seek', type: 'Container' },
0x13ab: { name: 'SeekID', type: 'Binary' },
0x13ac: { name: 'SeekPosition', type: 'Uint' },
0x549a966: { name: 'Info', type: 'Container' },
0x33a4: { name: 'SegmentUID', type: 'Binary' },
0x3384: { name: 'SegmentFilename', type: 'String' },
0x1cb923: { name: 'PrevUID', type: 'Binary' },
0x1c83ab: { name: 'PrevFilename', type: 'String' },
0x1eb923: { name: 'NextUID', type: 'Binary' },
0x1e83bb: { name: 'NextFilename', type: 'String' },
0x444: { name: 'SegmentFamily', type: 'Binary' },
0x2924: { name: 'ChapterTranslate', type: 'Container' },
0x29fc: { name: 'ChapterTranslateEditionUID', type: 'Uint' },
0x29bf: { name: 'ChapterTranslateCodec', type: 'Uint' },
0x29a5: { name: 'ChapterTranslateID', type: 'Binary' },
0xad7b1: { name: 'TimecodeScale', type: 'Uint' },
0x489: { name: 'Duration', type: 'Float' },
0x461: { name: 'DateUTC', type: 'Date' },
0x3ba9: { name: 'Title', type: 'String' },
0xd80: { name: 'MuxingApp', type: 'String' },
0x1741: { name: 'WritingApp', type: 'String' },
// 0xf43b675: { name: 'Cluster', type: 'Container' },
0x67: { name: 'Timecode', type: 'Uint' },
0x1854: { name: 'SilentTracks', type: 'Container' },
0x18d7: { name: 'SilentTrackNumber', type: 'Uint' },
0x27: { name: 'Position', type: 'Uint' },
0x2b: { name: 'PrevSize', type: 'Uint' },
0x23: { name: 'SimpleBlock', type: 'Binary' },
0x20: { name: 'BlockGroup', type: 'Container' },
0x21: { name: 'Block', type: 'Binary' },
0x22: { name: 'BlockVirtual', type: 'Binary' },
0x35a1: { name: 'BlockAdditions', type: 'Container' },
0x26: { name: 'BlockMore', type: 'Container' },
0x6e: { name: 'BlockAddID', type: 'Uint' },
0x25: { name: 'BlockAdditional', type: 'Binary' },
0x1b: { name: 'BlockDuration', type: 'Uint' },
0x7a: { name: 'ReferencePriority', type: 'Uint' },
0x7b: { name: 'ReferenceBlock', type: 'Int' },
0x7d: { name: 'ReferenceVirtual', type: 'Int' },
0x24: { name: 'CodecState', type: 'Binary' },
0x35a2: { name: 'DiscardPadding', type: 'Int' },
0xe: { name: 'Slices', type: 'Container' },
0x68: { name: 'TimeSlice', type: 'Container' },
0x4c: { name: 'LaceNumber', type: 'Uint' },
0x4d: { name: 'FrameNumber', type: 'Uint' },
0x4b: { name: 'BlockAdditionID', type: 'Uint' },
0x4e: { name: 'Delay', type: 'Uint' },
0x4f: { name: 'SliceDuration', type: 'Uint' },
0x48: { name: 'ReferenceFrame', type: 'Container' },
0x49: { name: 'ReferenceOffset', type: 'Uint' },
0x4a: { name: 'ReferenceTimeCode', type: 'Uint' },
0x2f: { name: 'EncryptedBlock', type: 'Binary' },
0x654ae6b: { name: 'Tracks', type: 'Container' },
0x2e: { name: 'TrackEntry', type: 'Container' },
0x57: { name: 'TrackNumber', type: 'Uint' },
0x33c5: { name: 'TrackUID', type: 'Uint' },
0x3: { name: 'TrackType', type: 'Uint' },
0x39: { name: 'FlagEnabled', type: 'Uint' },
0x8: { name: 'FlagDefault', type: 'Uint' },
0x15aa: { name: 'FlagForced', type: 'Uint' },
0x1c: { name: 'FlagLacing', type: 'Uint' },
0x2de7: { name: 'MinCache', type: 'Uint' },
0x2df8: { name: 'MaxCache', type: 'Uint' },
0x3e383: { name: 'DefaultDuration', type: 'Uint' },
0x34e7a: { name: 'DefaultDecodedFieldDuration', type: 'Uint' },
0x3314f: { name: 'TrackTimecodeScale', type: 'Float' },
0x137f: { name: 'TrackOffset', type: 'Int' },
0x15ee: { name: 'MaxBlockAdditionID', type: 'Uint' },
0x136e: { name: 'Name', type: 'String' },
0x2b59c: { name: 'Language', type: 'String' },
0x6: { name: 'CodecID', type: 'String' },
0x23a2: { name: 'CodecPrivate', type: 'Binary' },
0x58688: { name: 'CodecName', type: 'String' },
0x3446: { name: 'AttachmentLink', type: 'Uint' },
0x1a9697: { name: 'CodecSettings', type: 'String' },
0x1b4040: { name: 'CodecInfoURL', type: 'String' },
0x6b240: { name: 'CodecDownloadURL', type: 'String' },
0x2a: { name: 'CodecDecodeAll', type: 'Uint' },
0x2fab: { name: 'TrackOverlay', type: 'Uint' },
0x16aa: { name: 'CodecDelay', type: 'Uint' },
0x16bb: { name: 'SeekPreRoll', type: 'Uint' },
0x2624: { name: 'TrackTranslate', type: 'Container' },
0x26fc: { name: 'TrackTranslateEditionUID', type: 'Uint' },
0x26bf: { name: 'TrackTranslateCodec', type: 'Uint' },
0x26a5: { name: 'TrackTranslateTrackID', type: 'Binary' },
0x60: { name: 'Video', type: 'Container' },
0x1a: { name: 'FlagInterlaced', type: 'Uint' },
0x13b8: { name: 'StereoMode', type: 'Uint' },
0x13c0: { name: 'AlphaMode', type: 'Uint' },
0x13b9: { name: 'OldStereoMode', type: 'Uint' },
0x30: { name: 'PixelWidth', type: 'Uint' },
0x3a: { name: 'PixelHeight', type: 'Uint' },
0x14aa: { name: 'PixelCropBottom', type: 'Uint' },
0x14bb: { name: 'PixelCropTop', type: 'Uint' },
0x14cc: { name: 'PixelCropLeft', type: 'Uint' },
0x14dd: { name: 'PixelCropRight', type: 'Uint' },
0x14b0: { name: 'DisplayWidth', type: 'Uint' },
0x14ba: { name: 'DisplayHeight', type: 'Uint' },
0x14b2: { name: 'DisplayUnit', type: 'Uint' },
0x14b3: { name: 'AspectRatioType', type: 'Uint' },
0xeb524: { name: 'ColourSpace', type: 'Binary' },
0xfb523: { name: 'GammaValue', type: 'Float' },
0x383e3: { name: 'FrameRate', type: 'Float' },
0x61: { name: 'Audio', type: 'Container' },
0x35: { name: 'SamplingFrequency', type: 'Float' },
0x38b5: { name: 'OutputSamplingFrequency', type: 'Float' },
0x1f: { name: 'Channels', type: 'Uint' },
0x3d7b: { name: 'ChannelPositions', type: 'Binary' },
0x2264: { name: 'BitDepth', type: 'Uint' },
0x62: { name: 'TrackOperation', type: 'Container' },
0x63: { name: 'TrackCombinePlanes', type: 'Container' },
0x64: { name: 'TrackPlane', type: 'Container' },
0x65: { name: 'TrackPlaneUID', type: 'Uint' },
0x66: { name: 'TrackPlaneType', type: 'Uint' },
0x69: { name: 'TrackJoinBlocks', type: 'Container' },
0x6d: { name: 'TrackJoinUID', type: 'Uint' },
0x40: { name: 'TrickTrackUID', type: 'Uint' },
0x41: { name: 'TrickTrackSegmentUID', type: 'Binary' },
0x46: { name: 'TrickTrackFlag', type: 'Uint' },
0x47: { name: 'TrickMasterTrackUID', type: 'Uint' },
0x44: { name: 'TrickMasterTrackSegmentUID', type: 'Binary' },
0x2d80: { name: 'ContentEncodings', type: 'Container' },
0x2240: { name: 'ContentEncoding', type: 'Container' },
0x1031: { name: 'ContentEncodingOrder', type: 'Uint' },
0x1032: { name: 'ContentEncodingScope', type: 'Uint' },
0x1033: { name: 'ContentEncodingType', type: 'Uint' },
0x1034: { name: 'ContentCompression', type: 'Container' },
0x254: { name: 'ContentCompAlgo', type: 'Uint' },
0x255: { name: 'ContentCompSettings', type: 'Binary' },
0x1035: { name: 'ContentEncryption', type: 'Container' },
0x7e1: { name: 'ContentEncAlgo', type: 'Uint' },
0x7e2: { name: 'ContentEncKeyID', type: 'Binary' },
0x7e3: { name: 'ContentSignature', type: 'Binary' },
0x7e4: { name: 'ContentSigKeyID', type: 'Binary' },
0x7e5: { name: 'ContentSigAlgo', type: 'Uint' },
0x7e6: { name: 'ContentSigHashAlgo', type: 'Uint' },
0xc53bb6b: { name: 'Cues', type: 'Container' },
0x3b: { name: 'CuePoint', type: 'Container' },
0x33: { name: 'CueTime', type: 'Uint' },
0x37: { name: 'CueTrackPositions', type: 'Container' },
0x77: { name: 'CueTrack', type: 'Uint' },
0x71: { name: 'CueClusterPosition', type: 'Uint' },
0x70: { name: 'CueRelativePosition', type: 'Uint' },
0x32: { name: 'CueDuration', type: 'Uint' },
0x1378: { name: 'CueBlockNumber', type: 'Uint' },
0x6a: { name: 'CueCodecState', type: 'Uint' },
0x5b: { name: 'CueReference', type: 'Container' },
0x16: { name: 'CueRefTime', type: 'Uint' },
0x17: { name: 'CueRefCluster', type: 'Uint' },
0x135f: { name: 'CueRefNumber', type: 'Uint' },
0x6b: { name: 'CueRefCodecState', type: 'Uint' },
0x941a469: { name: 'Attachments', type: 'Container' },
0x21a7: { name: 'AttachedFile', type: 'Container' },
0x67e: { name: 'FileDescription', type: 'String' },
0x66e: { name: 'FileName', type: 'String' },
0x660: { name: 'FileMimeType', type: 'String' },
0x65c: { name: 'FileData', type: 'Binary' },
0x6ae: { name: 'FileUID', type: 'Uint' },
0x675: { name: 'FileReferral', type: 'Binary' },
0x661: { name: 'FileUsedStartTime', type: 'Uint' },
0x662: { name: 'FileUsedEndTime', type: 'Uint' },
0x43a770: { name: 'Chapters', type: 'Container' },
0x5b9: { name: 'EditionEntry', type: 'Container' },
0x5bc: { name: 'EditionUID', type: 'Uint' },
0x5bd: { name: 'EditionFlagHidden', type: 'Uint' },
0x5db: { name: 'EditionFlagDefault', type: 'Uint' },
0x5dd: { name: 'EditionFlagOrdered', type: 'Uint' },
0x36: { name: 'ChapterAtom', type: 'Container' },
0x33c4: { name: 'ChapterUID', type: 'Uint' },
0x1654: { name: 'ChapterStringUID', type: 'String' },
0x11: { name: 'ChapterTimeStart', type: 'Uint' },
0x12: { name: 'ChapterTimeEnd', type: 'Uint' },
0x18: { name: 'ChapterFlagHidden', type: 'Uint' },
0x598: { name: 'ChapterFlagEnabled', type: 'Uint' },
0x2e67: { name: 'ChapterSegmentUID', type: 'Binary' },
0x2ebc: { name: 'ChapterSegmentEditionUID', type: 'Uint' },
0x23c3: { name: 'ChapterPhysicalEquiv', type: 'Uint' },
0xf: { name: 'ChapterTrack', type: 'Container' },
0x9: { name: 'ChapterTrackNumber', type: 'Uint' },
0x0: { name: 'ChapterDisplay', type: 'Container' },
0x5: { name: 'ChapString', type: 'String' },
0x37c: { name: 'ChapLanguage', type: 'String' },
0x37e: { name: 'ChapCountry', type: 'String' },
0x2944: { name: 'ChapProcess', type: 'Container' },
0x2955: { name: 'ChapProcessCodecID', type: 'Uint' },
0x50d: { name: 'ChapProcessPrivate', type: 'Binary' },
0x2911: { name: 'ChapProcessCommand', type: 'Container' },
0x2922: { name: 'ChapProcessTime', type: 'Uint' },
0x2933: { name: 'ChapProcessData', type: 'Binary' },
0x254c367: { name: 'Tags', type: 'Container' },
0x3373: { name: 'Tag', type: 'Container' },
0x23c0: { name: 'Targets', type: 'Container' },
0x28ca: { name: 'TargetTypeValue', type: 'Uint' },
0x23ca: { name: 'TargetType', type: 'String' },
0x23c5: { name: 'TagTrackUID', type: 'Uint' },
0x23c9: { name: 'TagEditionUID', type: 'Uint' },
0x23c4: { name: 'TagChapterUID', type: 'Uint' },
0x23c6: { name: 'TagAttachmentUID', type: 'Uint' },
0x27c8: { name: 'SimpleTag', type: 'Container' },
0x5a3: { name: 'TagName', type: 'String' },
0x47a: { name: 'TagLanguage', type: 'String' },
0x484: { name: 'TagDefault', type: 'Uint' },
0x487: { name: 'TagString', type: 'String' },
0x485: { name: 'TagBinary', type: 'Binary' },
}
class WebmBase<T> {
source?: Uint8Array
data?: T
name: string
type: string
constructor(name = 'Unknown', type = 'Unknown') {
this.name = name
this.type = type
}
updateBySource() {}
setSource(source: Uint8Array) {
this.source = source
this.updateBySource()
}
updateByData() {}
setData(data: T) {
this.data = data
this.updateByData()
}
}
class WebmUint extends WebmBase<string> {
constructor(name: string, type: string) {
super(name, type || 'Uint')
}
updateBySource() {
// use hex representation of a number instead of number value
this.data = ''
for (let i = 0; i < this.source!.length; i++) {
const hex = this.source![i].toString(16)
this.data += padHex(hex)
}
}
updateByData() {
const length = this.data!.length / 2
this.source = new Uint8Array(length)
for (let i = 0; i < length; i++) {
const hex = this.data!.substr(i * 2, 2)
this.source[i] = parseInt(hex, 16)
}
}
getValue() {
return parseInt(this.data!, 16)
}
setValue(value: number) {
this.setData(padHex(value.toString(16)))
}
}
function padHex(hex: string) {
return hex.length % 2 === 1 ? '0' + hex : hex
}
class WebmFloat extends WebmBase<number> {
constructor(name: string, type: string) {
super(name, type || 'Float')
}
getFloatArrayType() {
return this.source && this.source.length === 4
? Float32Array
: Float64Array
}
updateBySource() {
const byteArray = this.source!.reverse()
const floatArrayType = this.getFloatArrayType()
const buffer = new ArrayBuffer(byteArray.buffer.byteLength)
new Uint8Array(buffer).set(new Uint8Array(byteArray.buffer))
const floatArray = new floatArrayType(buffer)
this.data! = floatArray[0]
}
updateByData() {
const floatArrayType = this.getFloatArrayType()
const floatArray = new floatArrayType([this.data!])
const byteArray = new Uint8Array(floatArray.buffer)
this.source = byteArray.reverse()
}
getValue() {
return this.data
}
setValue(value: number) {
this.setData(value)
}
}
interface ContainerData {
id: number
idHex?: string
// eslint-disable-next-line @typescript-eslint/no-explicit-any
data: WebmBase<any>
}
class WebmContainer extends WebmBase<ContainerData[]> {
offset: number = 0
data: ContainerData[] = []
constructor(name: string, type: string) {
super(name, type || 'Container')
}
readByte() {
return this.source![this.offset++]
}
readUint() {
const firstByte = this.readByte()
const bytes = 8 - firstByte.toString(2).length
let value = firstByte - (1 << (7 - bytes))
for (let i = 0; i < bytes; i++) {
// don't use bit operators to support x86
value *= 256
value += this.readByte()
}
return value
}
updateBySource() {
let end: number | undefined = undefined
this.data = []
for (
this.offset = 0;
this.offset < this.source!.length;
this.offset = end
) {
const id = this.readUint()
const len = this.readUint()
end = Math.min(this.offset + len, this.source!.length)
const data = this.source!.slice(this.offset, end)
const info = sections[id] || { name: 'Unknown', type: 'Unknown' }
// eslint-disable-next-line @typescript-eslint/no-explicit-any
let ctr: any = WebmBase
switch (info.type) {
case 'Container':
ctr = WebmContainer
break
case 'Uint':
ctr = WebmUint
break
case 'Float':
ctr = WebmFloat
break
}
const section = new ctr(info.name, info.type)
section.setSource(data)
this.data.push({
id,
idHex: id.toString(16),
data: section,
})
}
}
writeUint(x: number, draft = false) {
let flag = 0x80
let bytes = 1
// eslint-disable-next-line no-empty
for (; x >= flag && bytes < 8; bytes++, flag *= 0x80) {}
if (!draft) {
let value = flag + x
for (let i = bytes - 1; i >= 0; i--) {
// don't use bit operators to support x86
const c = value % 256
this.source![this.offset! + i] = c
value = (value - c) / 256
}
}
this.offset += bytes
}
writeSections(draft = false) {
this.offset = 0
for (let i = 0; i < this.data.length; i++) {
const section = this.data[i],
content = section.data.source,
contentLength = content!.length
this.writeUint(section.id, draft)
this.writeUint(contentLength, draft)
if (!draft) {
this.source!.set(content!, this.offset)
}
this.offset += contentLength
}
return this.offset
}
updateByData() {
// run without accessing this.source to determine total length - need to know it to create Uint8Array
const length = this.writeSections(true)
this.source = new Uint8Array(length)
// now really write data
this.writeSections()
}
getSectionById(id: number) {
for (let i = 0; i < this.data.length; i++) {
const section = this.data[i]
if (section.id === id) {
return section.data
}
}
return undefined
}
}
class WebmFile extends WebmContainer {
constructor(source: Uint8Array) {
super('File', 'File')
this.setSource(source)
}
fixDuration(duration: number) {
const segmentSection = this.getSectionById(0x8538067) as WebmContainer
if (!segmentSection) {
return false
}
const infoSection = segmentSection.getSectionById(
0x549a966
) as WebmContainer
if (!infoSection) {
return false
}
const timeScaleSection = infoSection.getSectionById(
0xad7b1
) as WebmFloat
if (!timeScaleSection) {
return false
}
let durationSection = infoSection.getSectionById(0x489) as WebmFloat
if (durationSection) {
if (durationSection.getValue()! <= 0) {
durationSection.setValue(duration)
} else {
return false
}
} else {
// append Duration section
durationSection = new WebmFloat('Duration', 'Float')
durationSection.setValue(duration)
infoSection.data.push({
id: 0x489,
data: durationSection,
})
}
// set default time scale to 1 millisecond (1000000 nanoseconds)
timeScaleSection.setValue(1000000)
infoSection.updateByData()
segmentSection.updateByData()
this.updateByData()
return true
}
toBlob(type = 'video/webm') {
const buffer = new ArrayBuffer(this.source!.buffer.byteLength)
new Uint8Array(buffer).set(new Uint8Array(this.source!.buffer))
return new Blob([buffer], { type })
}
}
/**
* Fixes duration on MediaRecorder output.
* @param blob Input Blob with incorrect duration.
* @param duration Correct duration (in milliseconds).
* @param type Output blob mimetype (default: video/webm).
* @returns
*/
export const webmFixDuration = (
blob: Blob,
duration: number,
type = 'video/webm'
): Promise<Blob> => {
return new Promise((resolve, reject) => {
try {
const reader = new FileReader()
reader.addEventListener('loadend', () => {
try {
const result = reader.result as ArrayBuffer
const file = new WebmFile(new Uint8Array(result))
if (file.fixDuration(duration)) {
resolve(file.toBlob(type))
} else {
resolve(blob)
}
} catch (ex) {
reject(ex)
}
})
reader.addEventListener('error', () =>
reject(new Error('FileReader error'))
)
reader.readAsArrayBuffer(blob)
} catch (ex) {
reject(ex)
}
})
}