/*
 * cmProc4.h (20KB)
 *
 * Part of libcm, a C development framework with an emphasis on
 * audio signal processing applications.
 */
  1. #ifndef cmProc4_h
  2. #define cmProc4_h
  3. #ifdef __cplusplus
  4. extern "C" {
  5. #endif
  6. typedef struct
  7. {
  8. unsigned smpIdx; // time tag sample index for val
  9. cmMidiByte_t val; //
  10. bool validFl; //
  11. } cmScFolBufEle_t;
  // A single score event as stored by the score follower (element of cmScFolLoc_t.evtV[]).
  typedef struct
  {
    unsigned pitch;     // pitch of the score event (presumably a MIDI pitch number - confirm)
    unsigned scEvtIdx;  // presumably the index of this event in the score's event list - confirm
  } cmScFolEvt_t;
  17. typedef struct
  18. {
  19. unsigned evtCnt; //
  20. cmScFolEvt_t* evtV; // pitchV[pitchCnt]
  21. unsigned scIdx; // index of the score loc (into cmScoreEvt[]) at this location
  22. int barNumb; // bar number of this location
  23. } cmScFolLoc_t;
  24. typedef struct
  25. {
  26. cmObj obj;
  27. cmReal_t srate; //
  28. cmScH_t scH; // score handle
  29. unsigned bufN; // event buffer count
  30. cmScFolBufEle_t* bufV; // event buffer bufV[bufN] - bufV[bufN-1] newest event, bufV[boi] oldest event
  31. int locN; // count of score locations
  32. cmScFolLoc_t* loc; // score loc[locN]
  33. unsigned sbi; // oldest score window index
  34. unsigned sei; // newest score window index
  35. unsigned msln; // minimum score look ahead count
  36. unsigned mswn; // maximum score window length
  37. unsigned forwardCnt; // count of score loc's to look ahead for a match to the current pitch when the optimal edit-dist alignment does not produce a match for the current pitch
  38. unsigned maxDist; // max. dist allowed to still consider matching
  39. unsigned minVel; // notes < minVel are ignored
  40. bool printFl; // true if pitch tracker reporting should be included
  41. bool noBackFl; // prevent the tracker from going backwards in time
  42. unsigned* edWndMtx;
  43. unsigned missCnt; // current consecutive unmatched notes
  44. unsigned matchCnt; // current consecutive matched notes
  45. unsigned eventIdx; // events since reset
  46. unsigned skipCnt; // notes skipped due to velocity
  47. unsigned ret_idx; // last tracked location
  48. } cmScFol;
  49. cmScFol* cmScFolAlloc( cmCtx* ctx, cmScFol* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  50. cmRC_t cmScFolFree( cmScFol** pp );
  51. cmRC_t cmScFolInit( cmScFol* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  52. cmRC_t cmScFolFinal( cmScFol* p );
  53. // Jump to a score location and reset the internal state of the follower.
  54. cmRC_t cmScFolReset( cmScFol* p, unsigned scoreIndex );
  55. // Give the follower a MIDI performance event. Only MIDI note-on events are acted upon;
  56. // all others are ignored.
  57. unsigned cmScFolExec( cmScFol* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  //=======================================================================================================================
  // Score tracker (cmScTrk) records.

  // A single score event as stored by the score tracker (element of cmScTrkLoc_t.evtV[]).
  typedef struct
  {
    unsigned pitch;     // pitch of the score event (presumably a MIDI pitch number - confirm)
    unsigned scEvtIdx;  // presumably the index of this event in the score's event list - confirm
    bool     matchFl;   // presumably set once this event has been matched to a performed note - confirm
  } cmScTrkEvt_t;
  65. typedef struct
  66. {
  67. unsigned evtCnt; //
  68. cmScTrkEvt_t* evtV; // evtV[evtCnt]
  69. unsigned scIdx; // index of the score event (into cmScoreEvt[]) at this location
  70. int barNumb; // bar number of this location
  71. } cmScTrkLoc_t;
  72. typedef struct
  73. {
  74. cmObj obj;
  75. cmScFol* sfp;
  76. double srate;
  77. cmScH_t scH;
  78. unsigned locN;
  79. cmScTrkLoc_t* loc;
  80. unsigned minVel;
  81. unsigned maxWndCnt;
  82. unsigned minWndLookAhead;
  83. bool printFl;
  84. int curLocIdx;
  85. unsigned evtIndex;
  86. } cmScTrk;
  87. cmScTrk* cmScTrkAlloc( cmCtx* ctx, cmScTrk* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  88. cmRC_t cmScTrkFree( cmScTrk** pp );
  89. cmRC_t cmScTrkInit( cmScTrk* p, cmReal_t srate, cmScH_t scH, unsigned bufN, unsigned minWndLookAhead, unsigned maxWndCnt, unsigned minVel );
  90. cmRC_t cmScTrkFinal( cmScTrk* p );
  91. // Jump to a score location and reset the internal state of the follower.
  92. cmRC_t cmScTrkReset( cmScTrk* p, unsigned scoreIndex );
  93. // Give the follower a MIDI performance event. Only MIDI note-on events are acted upon;
  94. // all others are ignored.
  95. unsigned cmScTrkExec( cmScTrk* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  //=======================================================================================================================
  //
  // Simplified string alignment function based on Levenshtein edit distance.
  //

  // Indexes into ed_val.v[].
  enum
  {
    kEdMinIdx,  // 0: the value which v[1:3] are compared against during backtracking
    kEdSubIdx,  // 1: substitute
    kEdDelIdx,  // 2: delete
    kEdInsIdx,  // 3: insert
    kEdCnt      // 4: count of elements in ed_val.v[]
  };
  101. typedef struct
  102. {
  103. unsigned v[kEdCnt];
  104. bool matchFl;
  105. bool transFl;
  106. } ed_val;
  // Linked list record describing one step of a path through the DP matrix ed_r.m[].
  typedef struct ed_path_str
  {
    unsigned            code;     // operation taken at this step (presumably one of the kEdXXXIdx values - confirm)
    unsigned            ri;       // matrix row index
    unsigned            ci;       // matrix column index
    bool                matchFl;  // presumably copied from the ed_val.matchFl of cell (ri,ci) - confirm
    bool                transFl;  // presumably copied from the ed_val.transFl of cell (ri,ci) - confirm
    struct ed_path_str* next;     // next record in the list
  } ed_path;
  116. /*
  117. Backtracking:
  118. m[rn,cn] is organized to indicate the mutation operations
  119. on s0[0:rn-1] or s1[0:cn-1] during backtracking.
  120. Backtracking begins at cell m[rn-1,cn-1] and proceeds
  121. up and left toward m[0,0]. The action to perform during
  122. backtracking is determined by examinging which values
  123. int m[].v[1:3] match m[].v[0].
  124. Match Next Cell
  125. Index Operation Location
  126. ----- ------------------------ ------------------------
  127. 1 Substitute char s0[ri-1] move diagonally; up-left
  128. 2 Delete char s0[ri-1] move up.
  129. 3 Delete char s1[ci-1] move left.
  130. (same as inserting blank
  131. into after s[ri-1]
  132. Note that more than one value in m[].v[1:3] may match
  133. m[].v[0]. In this case the candidate solution branches
  134. at this point in the candidate selection processes.
  135. */
  136. typedef struct
  137. {
  138. const char* s0; // forms rows of m[] - mutate to match s1 - rn=strlen(s0)
  139. const char* s1; // forms columns of m[] - target string - cn=strlen(s1)
  140. unsigned rn; // length of s0 + 1
  141. unsigned cn; // length of s1 + 1
  142. ed_val* m; // m[rn,cn]
  143. unsigned pn; // rn+cn
  144. ed_path* p_mem; // pmem[ 2*pn ];
  145. ed_path* p_avl; // available path record linked list
  146. ed_path* p_cur; // current path linked list
  147. ed_path* p_opt; // p_opt[pn] current best alignment
  148. double s_opt; // score of the current best alignment
  149. } ed_r;
  150. // print the DP matrix ed_r.m[rn,cn].
  151. void ed_print_mtx( ed_r* r );
  152. // Initialize ed_r.
  153. void ed_init( ed_r* r, const char* s0, const char* s1 );
  154. // Fill in the DP matrix.
  155. void ed_calc_mtx( ed_r* r );
  156. // Traverse the possible alignments in the DP matrix and determine the optimal alignment.
  157. void ed_align( ed_r* r );
  158. // Print the optimal alignment p_opt[]
  159. void ed_print_opt( ed_r* r );
  160. // Free resource allocated by ed_init().
  161. void ed_free(ed_r* r);
  162. // Main test function.
  163. void ed_main();
  //=======================================================================================================================
  // Score matcher (cmScMatch) records.

  // Indexes into cmScMatchVal_t.v[].
  enum
  {
    kSmMinIdx,  // 0: NOTE(review): by analogy with kEdMinIdx, presumably the minimum of the other three - confirm
    kSmSubIdx,  // 1: 'substitute' - may or may not match
    kSmDelIdx,  // 2: 'delete' - delete a MIDI note
    kSmInsIdx,  // 3: 'insert' - insert a space in the score
    kSmCnt      // 4: count of elements in cmScMatchVal_t.v[]
  };
  // Bit flags; presumably the values stored in cmScMatchVal_t.flags and cmScMatchPath_t.flags - confirm.
  enum
  {
    kSmMatchFl = 0x01,  // presumably: the substitution is an exact match - confirm
    kSmTransFl = 0x02   // presumably: the element is part of a transposed (reversed) pair - confirm
  };
  178. // Dynamic Programming (DP) matrix element
  179. typedef struct
  180. {
  181. unsigned v[kSmCnt]; //
  182. unsigned flags;
  183. } cmScMatchVal_t;
  // List record used to track a path through the DP matrix p->m[,]
  typedef struct cmScMatchPath_str
  {
    unsigned                  code;    // operation taken at this step (presumably one of the kSmXXXIdx values - confirm)
    unsigned                  ri;      // matrix row index
    unsigned                  ci;      // matrix column index
    unsigned                  flags;   // presumably a combination of kSmMatchFl | kSmTransFl - confirm
    unsigned                  locIdx;  // presumably the index into cmScMatch.loc[] associated with this step - confirm
    struct cmScMatchPath_str* next;    // next record in the list
  } cmScMatchPath_t;
  // Score note event record (element of cmScMatchLoc_t.evtV[]).
  typedef struct cmScMatchEvt_str
  {
    unsigned pitch;  // pitch of the score event (presumably a MIDI pitch number - confirm)
  } cmScMatchEvt_t;
  198. // Score location record.
  199. typedef struct
  200. {
  201. unsigned evtCnt; //
  202. cmScMatchEvt_t* evtV; // evtV[evtCnt]
  203. unsigned scLocIdx; // scH score location index
  204. int barNumb; // bar number of this location
  205. } cmScMatchLoc_t;
  206. typedef struct
  207. {
  208. cmObj obj;
  209. cmScH_t scH; //
  210. unsigned locN; //
  211. cmScMatchLoc_t* loc; // loc[locN]
  212. unsigned mrn; // max row count (midi)
  213. unsigned rn; // cur row count
  214. unsigned mcn; // max column count (score)
  215. unsigned cn; // cur column count
  216. unsigned mmn; // max length of midiBuf[] (mrn-1)
  217. unsigned msn; // max length of score window (mcn-1)
  218. cmScMatchVal_t* m; // m[mrn,mcn] DP matrix
  219. unsigned pn; // mrn+mcn
  220. cmScMatchPath_t* p_mem; // pmem[ 2*pn ];
  221. cmScMatchPath_t* p_avl; // available path record linked list
  222. cmScMatchPath_t* p_cur; // current path linked list
  223. cmScMatchPath_t* p_opt; // p_opt[pn] current best alignment
  224. double opt_cost; // p_opt cost set by cmScMatchExec()
  225. } cmScMatch;
  226. cmScMatch* cmScMatchAlloc( cmCtx* c, cmScMatch* p, cmScH_t scH, unsigned maxScWndN, unsigned maxMidiWndN );
  227. cmRC_t cmScMatchFree( cmScMatch** pp );
  228. cmRC_t cmScMatchInit( cmScMatch* p, cmScH_t scH, unsigned maxScWndN, unsigned maxMidiWndN );
  229. cmRC_t cmScMatchFinal( cmScMatch* p );
  230. // Returns cmEofRC if scLocIdx + locN > p->locN - note that this is not necessarily an error.
  231. // The optimal path p_opt[] will only be updated if the edit cost is less than min_cost.
  232. // Set min_cost to DBL_MAX to force p_opt[] to be updated.
  233. cmRC_t cmScMatchExec( cmScMatch* p, unsigned scLocIdx, unsigned locN, const unsigned* midiPitchV, unsigned midiPitchN, double min_cost );
  //=======================================================================================================================
  // Score matcher driver (cmScMatcher) records.

  // A buffered MIDI event (element of cmScMatcher.midiBuf[]).
  typedef struct
  {
    unsigned locIdx;  // location assoc'd with this MIDI evt (cmInvalidIdx if not a positive-match)
    unsigned cbCnt;   // count of times this event has been sent via the callback
    unsigned mni;     // unique identifier for this event since previous call to cmScAlignReset().
                      // NOTE(review): cmScMatcher.mni refers to cmScMatcherReset() - confirm which reset applies here.
    unsigned smpIdx;  // time stamp of this event
    unsigned pitch;   // MIDI note pitch
    unsigned vel;     // MIDI note velocity
  } cmScMatcherMidi_t;
  // A match result record (element of cmScMatcher.res[]).
  typedef struct
  {
    unsigned locIdx;  // presumably the score location assigned to this MIDI event - confirm
    unsigned mni;     // presumably the cmScMatcherMidi_t.mni of the MIDI event - confirm
    unsigned pitch;   // presumably the pitch of the MIDI event - confirm
    unsigned vel;     // presumably the velocity of the MIDI event - confirm
    bool     tpFl;    // true positive
    bool     fpFl;    // false positive
  } cmScMatcherResult_t;
  253. typedef struct
  254. {
  255. cmObj obj;
  256. cmScMatch* mp;
  257. unsigned mn;
  258. cmScMatcherMidi_t* midiBuf; // midiBuf[mn]
  259. cmScMatcherResult_t* res; // res[rn]
  260. unsigned rn; // length of res[]
  261. unsigned ri; // next avail res[] recd.
  262. double s_opt; //
  263. unsigned missCnt; // count of consecutive trailing non-matches
  264. unsigned esi; // index into loc[] of the last positive match.
  265. unsigned mni; // track the count of MIDI events since the last call to cmScMatcherReset()
  266. unsigned mbi; // index of oldest MIDI event in midiBuf[]; 0 when the buffer is full.
  267. unsigned begSyncLocIdx; // start of score window, in mp->loc[], of best match in previous scan
  268. unsigned stepCnt; // count of forward/backward score loc's to examine for a match during cmScMatcherStep().
  269. unsigned maxMissCnt; // max. number of consecutive non-matches during step prior to executing a scan.
  270. unsigned scanCnt; // count of time scan was executed inside cmScMatcherStep()
  271. } cmScMatcher;
  272. cmScMatcher* cmScMatcherAlloc( cmCtx* c, cmScMatcher* p, double srate, cmScH_t scH, unsigned scWndN, unsigned midiWndN );
  273. cmRC_t cmScMatcherFree( cmScMatcher** pp );
  274. cmRC_t cmScMatcherInit( cmScMatcher* p, double srate, cmScH_t scH, unsigned scWndN, unsigned midiWndN );
  275. cmRC_t cmScMatcherFinal( cmScMatcher* p );
  276. void cmScMatcherReset( cmScMatcher* p );
  277. bool cmScMatcherInputMidi( cmScMatcher* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  278. // Slide a score window scanCnt times, beginning at 'bsi',
  279. // looking for the best match to p->midiBuf[]. The score window
  280. // contain scWndN (p->mp->mcn-1) score locations.
  281. // Returns the index into p->mp->loc[] of the start of the best
  282. // match score window. The score associated
  283. // with this match is stored in s_opt.
  284. unsigned cmScMatcherScan( cmScMatcher* p, unsigned bsi, unsigned scanCnt );
  285. // Step forward/back by p->stepCnt from p->esi.
  286. // p->esi must therefore be valid prior to calling this function.
  287. // If more than p->maxMissCnt consecutive MIDI events are
  288. // missed then automatically run cmScAlignScan().
  289. // Return cmEofRC if the end of the score is encountered.
  290. // Return cmSubSysFailRC if an internal scan resync. failed.
  291. cmRC_t cmScMatcherStep( cmScMatcher* p );
  292. cmRC_t cmScMatcherExec( cmScMatcher* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  //=======================================================================================================================
  // Score aligner (cmScAlign) records.

  // Indexes into cmScAlignVal_t.v[].
  enum
  {
    kSaMinIdx,  // 0: NOTE(review): by analogy with kEdMinIdx, presumably the minimum of the other three - confirm
    kSaSubIdx,  // 1: 'substitute' - may or may not match
    kSaDelIdx,  // 2: 'delete' - delete a MIDI note
    kSaInsIdx,  // 3: 'insert' - insert a space in the score
    kSaCnt      // 4: count of elements in cmScAlignVal_t.v[]
  };
  302. // Dynamic Programming (DP) matrix element
  303. typedef struct
  304. {
  305. unsigned v[kSaCnt]; //
  306. bool matchFl; // if this is a substitute; is it also a match?
  307. bool transFl; // if this is a substitute; is this the second element in a reversed pair?
  308. } cmScAlignVal_t;
  // List record used to track a path through the DP matrix p->m[,]
  typedef struct cmScAlignPath_str
  {
    unsigned                  code;     // operation taken at this step (presumably one of the kSaXXXIdx values - confirm)
    unsigned                  ri;       // matrix row index
    unsigned                  ci;       // matrix column index
    bool                      matchFl;  // presumably copied from cmScAlignVal_t.matchFl - confirm
    bool                      transFl;  // presumably copied from cmScAlignVal_t.transFl - confirm
    unsigned                  locIdx;   // presumably the index into cmScAlign.loc[] associated with this step - confirm
    struct cmScAlignPath_str* next;     // next record in the list
  } cmScAlignPath_t;
  // Score note event record
  typedef struct
  {
    unsigned pitch;  // pitch of the score event (presumably a MIDI pitch number - confirm)
  } cmScAlignScEvt_t;
  325. // Score location record.
  326. typedef struct
  327. {
  328. unsigned evtCnt; //
  329. cmScAlignScEvt_t* evtV; // evtV[evtCnt]
  330. unsigned scLocIdx; // scH score location index
  331. int barNumb; // bar number of this location
  332. } cmScAlignLoc_t;
  // A buffered MIDI event (element of cmScAlign.midiBuf[]).
  typedef struct
  {
    unsigned locIdx;  // location assoc'd with this MIDI evt (cmInvalidIdx if not a positive-match)
    unsigned cbCnt;   // count of times this event has been sent via the callback
    unsigned mni;     // unique identifier for this event since previous call to cmScAlignReset().
    unsigned smpIdx;  // time stamp of this event
    unsigned pitch;   // MIDI note pitch
    unsigned vel;     // MIDI note velocity
  } cmScAlignMidiEvt_t;
  // An alignment result record (element of cmScAlign.res[]).
  typedef struct
  {
    unsigned locIdx;   // loc[] sync. location
    unsigned smpIdx;   // presumably the time stamp of the MIDI event - confirm
    unsigned mni;      // MIDI event unique index
    unsigned pitch;    // MIDI event pitch which may not match the score event pitch
    unsigned vel;      // MIDI event velocity
    bool     matchFl;  // presumably true if the MIDI pitch matched the score pitch - confirm
    bool     transFl;  // presumably true if the match was part of a reversed pair - confirm
    bool     foundFl;  // NOTE(review): meaning is not stated in this header - confirm in cmProc4.c
  } cmScAlignResult_t;
  // Type of the callback function registered through cmScAlignAlloc()/cmScAlignInit().
  // 'cbArg' is the user pointer supplied at registration (see cmScAlign.cbArg).
  // NOTE(review): 'scLocIdx', 'mni', 'pitch' and 'vel' presumably describe a MIDI event
  // and the score location it was matched to - confirm in cmProc4.c.
  typedef void (*cmScAlignCb_t)( void* cbArg, unsigned scLocIdx, unsigned mni, unsigned pitch, unsigned vel );
  355. typedef struct
  356. {
  357. cmObj obj;
  358. cmScAlignCb_t cbFunc; //
  359. void* cbArg; //
  360. cmScH_t scH; //
  361. double srate; //
  362. unsigned locN; // length of loc[]
  363. cmScAlignLoc_t* loc; // loc[locN] score array
  364. unsigned rn; // length of midiBuf[] (mn+1)
  365. unsigned cn; // length of score window (scWndN+1)
  366. unsigned mn; // length of midiBuf[] (rn-1)
  367. cmScAlignMidiEvt_t* midiBuf; // midiBuf[ mn ]
  368. unsigned mbi; // index of first element in midiBuf[] - this is required because the MIDI buf fills from the end to the beginning
  369. unsigned mni; // index of event in midiBuf[p->mn] - increments on each note inserted into midiBuf[] - zeroed by cmScAlignReset().
  370. cmScAlignVal_t* m; // m[rn,cn]
  371. unsigned pn; // rn+cn
  372. cmScAlignPath_t* p_mem; // pmem[ 2*pn ];
  373. cmScAlignPath_t* p_avl; // available path record linked list
  374. cmScAlignPath_t* p_cur; // current path linked list
  375. cmScAlignPath_t* p_opt; // p_opt[pn] current best alignment
  376. double s_opt; // score of the current best alignment
  377. unsigned esi; // loc[] index of latest positive match
  378. unsigned missCnt; // count of consecutive trailing MIDI events without positive matches
  379. unsigned scanCnt;
  380. bool printFl;
  381. unsigned begScanLocIdx; // begin the search at this score locations scWnd[begScanLocIdx:begScanLocIdx+p->cn-1]
  382. unsigned begSyncLocIdx; // initial sync location
  383. unsigned resN; // count of records in res[] == 2*cmScoreEvtCount()
  384. cmScAlignResult_t* res; // res[resN]
  385. unsigned ri; //
  386. int stepCnt; // count of loc[] locations to step ahead/back during a cmScAlignStep() operation.
  387. int maxStepMissCnt; // max. consecutive trailing non-positive matches before a scan takes place.
  388. } cmScAlign;
  389. cmScAlign* cmScAlignAlloc( cmCtx* ctx, cmScAlign* p, cmScAlignCb_t cbFunc, void* cbArg, cmReal_t srate, cmScH_t scH, unsigned midiN, unsigned scWndN );
  390. cmRC_t cmScAlignFree( cmScAlign** pp );
  391. cmRC_t cmScAlignInit( cmScAlign* p, cmScAlignCb_t cbFunc, void* cbArg, cmReal_t srate, cmScH_t scH, unsigned midiN, unsigned scWndN );
  392. cmRC_t cmScAlignFinal( cmScAlign* p );
  393. void cmScAlignReset( cmScAlign* p, unsigned begScanLocIdx );
  394. cmRC_t cmScAlignExec( cmScAlign* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  395. bool cmScAlignInputMidi( cmScAlign* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1 );
  396. // Scan from p->begScanLocIdx to the end of the score looking
  397. // for the best match to p->midiBuf[].
  398. // Returns the score location index which best matches the
  399. // first note p->midiBuf[]. The score associated
  400. // with this match is stored in s_opt.
  401. unsigned cmScAlignScan( cmScAlign* p, unsigned scanCnt );
  402. // Step forward/back by p->stepCnt from p->esi.
  403. // If more than p->maxStepMissCnt consecutive MIDI events are
  404. // missed then automatically run cmScAlignScan().
  405. // Return cmEofRC if the end of the score is encountered.
  406. // Return cmSubSysFailRC if an internal scan resync. failed.
  407. cmRC_t cmScAlignStep( cmScAlign* p );
  408. unsigned cmScAlignScanToTimeLineEvent( cmScMatcher* p, cmTlH_t tlH, cmTlObj_t* top, unsigned endSmpIdx );
  409. // Given a score, a time-line, and a marker on the time line scan the
  410. // entire score looking for the best match between the first 'midiN'
  411. // notes in each marker region and the score.
  412. void cmScAlignScanMarkers( cmRpt_t* rpt, cmTlH_t tlH, cmScH_t scH );
  //=======================================================================================================================
  // Score measurement (cmScMeas) records.

  // A MIDI event record (element of cmScMeas.midi[]).
  typedef struct
  {
    unsigned mni;     // presumably the unique index of the MIDI event (compare cmScAlignMidiEvt_t.mni) - confirm
    unsigned locIdx;  // presumably the score location associated with the event - confirm
    unsigned pitch;   // presumably the MIDI note pitch - confirm
    unsigned vel;     // presumably the MIDI note velocity - confirm
    unsigned smpIdx;  // presumably the time stamp of the event - confirm
  } cmScMeasMidi_t;
  422. typedef struct
  423. {
  424. cmScoreSet_t* set; // A pointer to defining score set
  425. unsigned bli; // Begin index into sap->loc[].
  426. unsigned eli; // End index into sap->loc[].
  427. unsigned bmi; // Begin index into midi[].
  428. unsigned emi; // End index into midi[].
  429. double* val; // val[sap->eleCnt]
  430. } cmScMeasSet_t;
  431. typedef struct
  432. {
  433. cmObj obj;
  434. cmScAlign* sap;
  435. unsigned mn;
  436. cmScMeasMidi_t* midi;
  437. } cmScMeas;
  438. cmScMeas* cmScMeasAlloc( cmCtx* c, cmScMeas* p, double srate, cmScH_t scH );
  439. cmRC_t cmScMeasFree( cmScMeas** pp );
  440. cmRC_t cmScMeasInit( cmScMeas* p, double srate, cmScH_t scH );
  441. cmRC_t cmScMeasFinal( cmScMeas* p );
  442. cmRC_t cmScMeasExec( cmScMeas* p, unsigned smpIdx, unsigned status, cmMidiByte_t d0, cmMidiByte_t d1, unsigned scLocIdx );
  443. #ifdef __cplusplus
  444. }
  445. #endif
  446. #endif