diff --git a/README.md b/README.md
index 73ab0e7..e6825d2 100644
--- a/README.md
+++ b/README.md
@@ -1,2 +1,21 @@
 # Journal-Utilities
 Utilities and documentation for creating content for the Active Inference Journal
+
+(A) The Python scripts
+(1) submits each recording to the cloud transcription service (the scripts are written against AssemblyAI's transcript API, which they refer to as "Cloud Whisper") and reformats the output to CSV.
+Invoke it from a local Linux command line. (The trailing "&" runs each python invocation in the background. Each instance polls the service every two minutes, and kicks off the four steps of the Extract-and-save phase of processing once the main processing of its request has completed or failed.)
+python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" "ls039-0" "http://crisiscenter.us/AILab01/2022Livestreams" "ActInf Livestream 039.0 ~ 'Morphogenesis as Bayesian inference'.m4a" | tee mass_ls039-0.m4a.json &
+python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" "ls039-1" "http://crisiscenter.us/AILab01/2022Livestreams" "ActInf Livestream 039.1 ~ 'Morphogenesis as Bayesian inference'.m4a" | tee mass_ls039-1.m4a.json &
+python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" "ls039-2" "http://crisiscenter.us/AILab01/2022Livestreams" "ActInf Livestream 039.2 ~ 'Morphogenesis as Bayesian inference'.m4a" | tee mass_ls039-2.m4a.json &
+
+(2) extracts speech and context data from the new local CSVs, and creates a simple text file that can be imported manually into a word processor and formatted with Title, Heading 1 (session), and Heading 2 (speakers, contents, transcript).
+
+
+(B) AllSpeakers.csv should be filled out manually using any spreadsheet program (an example layout is sketched in a comment at the end of Scripts/2_sentencesToTranscripts.py).
+These data are read by the sentencesToTranscripts script, which uses them to convert the service-generated speaker labels "A", "B", ... into "Daniel", "Bleu", ...
+Even if AllSpeakers.csv is correct, the raw, editable .txt file may still need its Speaker lines adjusted by hand - this happens when the transcription engine gets confused by accents or prosody.
+
+
+--------
+
+Initial Scripts 1 & 2, and initial README, contributed by Dave Douglass, November 2022.
diff --git a/Scripts/1_SubmitToCloudWhisper.py b/Scripts/1_SubmitToCloudWhisper.py
new file mode 100644
index 0000000..f29946d
--- /dev/null
+++ b/Scripts/1_SubmitToCloudWhisper.py
@@ -0,0 +1,1524 @@
+#! 
...python3 +#cd "/mnt/d/Documents/FEP-AI/2022 Livestreams/Mass 2022 Livestreams" + #python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" ls048-1 "http://crisiscenter.us/AILab01/2022Livestreams" "ls048-1.m4a" | tee ls048-1.m4a.json & + # myID['ls048-0']= "rx1rvgss4t-2e6c-46ee-a0d4-42777283a9b1" + # myID['ls048-1']= 'rxytoplp16-7b8b-41a6-be1b-78a0a837d8d4' + +#cd "/mnt/d/Documents/FEP-AI/2022 ModelStream/mo007/resubmit" rxzfu6wsa1-06f3-4028-8bf7-355d7f61eb00 + #python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" mo007-1 "http://crisiscenter.us/AILab01/2022Livestreams" "mo007-1.m4a" | tee mo007-1.m4a.json & + +# D:\Documents\FEP-AI\2022 Livestreams\ActInf Livestream #036 Modeling Ourselves\ls036-1>"D:\Program Files\LibreOffice\program\soffice.exe" --help + +#D:\Documents\FEP-AI\Active Inference Podcast\Transcribe via Whisper.json +#call with python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/Transcribe via Whisper.py" ls037-0 "http://crisiscenter.us/AILab01/2022Livestreams" "ls037-0.m4a" rs3z2z81w6-4507-4918-b001-7c08ebad22a6 +#call with python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/Transcribe via Whisper.py" ls037-1 "http://crisiscenter.us/AILab01/2022Livestreams" "ls037-1.mp3" | tee ls037-1.mp3.json rsury59afm-90b2-4049-9d08-cbb116e36808 +#cd /mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #037 Stephen Mann - Free Energy A User's Guide/ls037-2 + #python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" ls037-2 "http://crisiscenter.us/AILab01/2022Livestreams" "ls037-2.m4a" | tee ls037-2.m4a.json +#cd /mnt/d/Music/Fugs + #python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" PBF "http://crisiscenter.us/misc" "DrStrangelovePreciousBodilyFluids.m4a" | tee PBF.m4a.json rsuh9skgre-a056-486e-8138-2e6608d21f04 +#cd "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #040 - Chris Fields... 
A free energy principle for generic quantum systems/ls040-1"
+# python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" ls040-1 "http://crisiscenter.us/AILab01/2022Livestreams" "ls040-1.m4a" | tee ls040-1.m4a.json
+
+#cd "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #041 - Axel Constant - Extended Active Inference beyond Skulls/ls040-1"
+# python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" ls041-1 "http://crisiscenter.us/AILab01/2022Livestreams" "ls041-1.m4a" | tee ls041-1.m4a.json
+#cd "/mnt/d/Documents/FEP-AI/2022 Livestreams/ls042/ls042-0"
+# python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/SubmitToCloudWhisper.py" ls042-0 "http://crisiscenter.us/AILab01/2022Livestreams" "ls042-0.m4a" | tee ls042-0.m4a.json
+
+
+# For more logic, see "Transcribe ls036 Modelling ourselves.txt" in "D:\Documents\FEP-AI\2022 Livestreams\ActInf Livestream #036 Modeling Ourselves"
+
+import requests
+import time
+import sys
+import math
+import csv
+import json
+
+#call with python3 - BerlinSym2021KJFKey "http://crisiscenter.us/AILab01/Karl_Friston_Applied_Active_Inference_Symposium_2021-06-22" "Quadrille.wav"
+#call with python3 - quadriTest "http://crisiscenter.us/AILab01/Karl_Friston_Applied_Active_Inference_Symposium_2021-06-22" "Quadrille.wav" rzw49dpr1n-4856-4172-adf4-e502720c93de
+
+#call with python3 - ls051-0 "http://crisiscenter.us/AILab01/2022Livestreams" "ls051-0.wav" rskfsnu6hj-8e56-4c7d-a4d1-76aa04ab873a
+#call with python3 - ls051-0-2 "http://crisiscenter.us/AILab01/2022Livestreams" "ls051-0-2.mp3" rsk599qwnx-7e0e-49c2-bafd-8cb0ad4745db
+
+#python3 - ls036-0 "http://crisiscenter.us/AILab01/2022Livestreams" "ls036-0.m4a"
+#call with python3 - ls036-2 "http://crisiscenter.us/AILab01/2022Livestreams" "ls036-2.m4a"
+
+if __name__ == "__main__":
+    print(f'Arguments count: {len(sys.argv)}')
+    if len(sys.argv) < 4:   # script name plus the three required positional arguments
+        print("Need at least docLabel, onlinePath, and onlineFile; exiting!")
+        quit()
+
+
+#for i, arg in enumerate(sys.argv):
+#    print(f'Argument {i:>6}: {arg}')
+
+docLabel = sys.argv[1]
+onlinePath = sys.argv[2]
+onlineFile = sys.argv[3]
+print("docLabel, onlinePath, onlineFile " + "'" + docLabel + "', '" + onlinePath + "', '" + onlineFile + "'")
+if len(sys.argv) > 4:
+    outputPath = sys.argv[4]
+    print("outputPath: " + "'" + outputPath + "'")
+
+
+
+# ---------------------
+
+
+def ToDisplayTime(tt):
+    # Convert a millisecond count to a human-readable "[h:]mm:ss" timestamp.
+    ts = float(tt)
+    h0 = int(ts/3600000.0)
+    hh = ""
+    if h0 > 9:
+        hh = str(100+h0)
+        hh = hh[1:3] + ":"
+    elif h0 > 0:
+        hh = str(h0) + ":"
+
+    m0 = int( (ts-(3600000.0*h0))/60000.0)
+    mm = str(100+m0)
+    s0 = int( (ts - (3600000.0*h0) - (60000.0*m0) ) /1000.0)
+    ss = str(100+s0)
+    to_time = hh + mm[1:3] + ":" + ss[1:3]
+    return to_time
+
+
+def ToSRTTime(tt):
+    # Convert a millisecond count to an SRT-style "hh:mm:ss,mmm" timestamp.
+    ts = float(tt)
+    h0 = int(ts/3600000.0)
+    hh = str(100+h0)
+    m0 = int( (ts-(3600000.0*h0))/60000.0)
+    mm = str(100+m0)
+    s0 = int( (ts - (3600000.0*h0) - (60000.0*m0) ) /1000.0)
+    ss = str(100+s0)
+    mms0 = int(ts - (3600000.0*h0) - (60000.0*m0) - (1000.0*s0))
+    mms = str(1000+mms0)
+    to_time = hh[1:3] + ":" + mm[1:3] + ":" + ss[1:3] + "," + mms[1:4]
+    return to_time
+
+
+
+# ---------------------
+
+
+#"audio_url": " + onlinePath + "/" + onlineFile + ",
+#"audio_url": "http://crisiscenter.us/AILab01/Karl_Friston_Applied_Active_Inference_Symposium_2021-06-22/Quadrille.wav",
+
+endpoint = "https://api.assemblyai.com/v2/transcript"
+audio_url = onlinePath + "/" + onlineFile
+
+# "speaker_labels": True,
+
+# for a fatter list - one containing an error - see "SubmitToCloudWhisper - Copy (13) - Try 
word_boost, spell again.py" + +json = { + "audio_url": audio_url, + "word_boost": ['a priori', +'Aaron Fath', +'Aaron J Fath', +'Abbas Edalat', +'accuracy', +'ActInf Lab', +'ActInf Livestream', +'ActInf', +'ActInf Lab project', +'ActInf Lab Livestream', +'Active Inference Livestream', +'ActInf Lab GuestStream', +'ActInf Lab OrgStream', +'Active Inference GuestStream', +'Active Inference OrgStream', +'ActInf Lab OrgStream', +'Active Inference ModelStream', +'ActInf Lab ModelStream', +'Active Inference MathStream', +'ActInf Lab MathStream', +'action oriented representation', +'action planning', +'action prediction', +'action', +'Active Inference Institute', +'Active Inference Lab', +'Active Inference', +'active states', +'active', +'activity', +'Adam Linson', +'Adam Safron', +'Adam Safron', +'adaptive', +'address', +'Adeel Razi', +'advantage function', +'affect', +'affordance', +'agency', +'agent', +'agreement', +'Aikaterini Fotopoulou', +'Alessandra Pedrocchi', +'Alex Kiefer', +'Alexander Strobel', +'align', +'allostasis', +'allostat', +'ambiguity', +'Amir Omidvarnia', +'ancestral', +'Andrea Gajardo Vidal', +'Andreas Kleinschmidt', +'Andrew Corcoran', +'Andrew W Corcoran', +'Anna Belardinelli', +'Annemie Ploeger', +'Anthony Chen', +'Anthony G Chen', +'Anthony Zador', +'and', +'ants', +'ant', +'anxiety', +'architectures', +'Ari E Kahn', +'Ari Kahn', +'Arnold Pfeffer', +'aspects', +'assumptions', +'asymmetry', +'attention', +'Attial', +'attributes', +'awareness', +'Axel Constant', +'bacterium like', +'Ballard', +'Bart Dhoedt', +'Bayesian inference', +'Bayesian statistics physics', +'Bayesian', +'behavior', +'belief updating', +'belief', +'beliefs', +'Bellman equation', +'Bellman', +'Beni', +'Benjamin Illingworth', +'Benucci', +'Bert de Vries', +'Bert de Vries', +'Bijan', +'bioelectric', +'biological', +'Biology and Philosophy', +'biology', +'Bitcoin', +'blanket states', +'Blei', +'Bleu', +'blueprint', +'bottom up', +'Botvinick', +'boundary', +'brain architecture', +'brain evolution', +'brain', +'Brea', +'Bull', +'Buzsaki', +'Canada', +'canonical', +'capacity curve', +'Carnap', +'Casper Hesp', +'Cathy J Price', +'Cathy Price', +'Chang Kim', +'Chang Sub Kim', +'Chantelle Gaylor', +'Chantelle M Gaylor', +'chaos', +'Charles C H Hong', +'Christian Guckelsberger', +'Christoph Mathys', +'Christoph Salge', +'Christopher D Frith', +'Christopher Frith', +'Christopher Lynn', +'Christopher W Lynn', +'Beren Milledge', +'Anil Seth', +'Calgary', +'Christopher L. 
Buckley', +'Claudia Clopath', +'Clopath', +'Coda', +'cognition', +'cognitive niche', +'cognitive science', +'cognitive studies', +'cognitive', +'coherence', +'coherent', +'comma', +'communication', +'competition', +'complexity', +'computational', +'computer', +'concept', +'concepts', +'connectivity', +'Conor Heins', +'Conor', +'continuum', +'control error', +'control theory', +'control', +'controlled process', +'controller', +'controls', +'conversation', +'Conway', +'correlation', +'Costa', +'counterfactuals', +'COVID', +'cue', +'culture', +'cybernetics', +'cycle', +'D Maisto', +'DAG', +'DAGs', +'Daniel Polani', +'Daniel Williams', +'Daniel', +'Danielle Bassett', +'Danielle de Kerckhove', +'Danielle Kerckhove', +'Danielle S Bassett', +'Daphne Demekas', +'Daphne', +'Dario Cuevas Rivera', +'Dario Cuevas Rivera', +'Dario Rivera', +'data', +'Dauwels', +'David Benrimoh', +'David Benton', +'David Cittern', +'David Green', +'David Krakauer', +'David McKay', +'David W Green', +'Dayan', +'DCM', +'de Vries', +'Dean', +'Declan Lewis', +'Deneve', +'Dennett', +'Diana Morelen', +'differentiate', +'dimension', +'Dimitrije Markovi', +'Dirichlet', +'distinctions', +'disturbance', +'domain', +'Dot EDU', +'Dot One', +'Dot Two', +'Dutch', +'dynamics', +'Earle Jamieson', +'ecological', +'Edda Bilek', +'Edelman', +'Eirik Sovik', +'Elenora Guanziroli', +'emergence', +'Emmanuel Dauce', +'Emmanuel Dauce', +'enactivism', +'encoding', +'endstopping', +'energy', +'English', +'ensemble', +'Ensor Palacios', +'Ensor Rafael Palacios', +'entorhinal', +'environment', +'enzymes', +'epistemic value', +'ergodicity', +'Erik Rietveld', +'errors', +'Ettore Ambrosini', +'evidence', +'evolution', +'Evolutionary Anthropology', +'exafferent', +'examples', +'expectation', +'expected free energy', +'exploration', +'explore', +'external states', +'exteroception', +'Fabienne Picard', +'Fabrice Bartolomei', +'Faisal Mushtaq', +'feedback control', +'feedback', +'Felix A Pollock', +'Felix Pollock', +'Feynman', +'field', +'fitness', +'flagella', +'Florian Ott', +'flow', +'fMRI imaging', +'fMRI', +'force', +'foraging', +'forage', +'forward model', +'framework', +'Francesco Donnarumma', +'Francesco Rigoli', +'Franco Molteni', +'Franz Kuchling', +'Frederike H Petzschner', +'Frederike Petzschner', +'Free Energy Principle', +'free energy', +'free', +'Friston blanket', +'Friston', +'function', +'gain', +'generalized capacity curve', +'generalized free energy', +'generative model', +'generative models', +'generative process', +'Geoffrey Bingham', +'Georgi Georgiev', +'Geraint Rees', +'Gerry Edelman', +'Giovanni Pezzulo', +'Giuseppe Pagnoni', +'goal directed', +'goal', +'Graeme D Jackson', +'Graeme Jackson', +'graph', +'Grigorios A Pavliotis', +'Grigorios Pavliotis', +'group', +'Guido Hesselmann', +'Hae Jeong Park', +'Hae Park', +'Harrison', +'Hayley A Young', +'Hayley Young', +'Hebbian', +'Helene Haker', +'Helmholtz Decomposition', +'Helmholtzian', +'Helmholtz', +'heuristic', +'hidden states', +'Hideaki', +'hierarchical model', +'Hinton', +'Hipolito', +'Hohwy', +'homeostatic', +'homeostat', +'Hugo Bottemanne', +'Brennan', +'Alexander Tschantz', +'Iain Couzin', +'idea', +'image', +'implication', +'inclination', +'increase', +'independent', +'individual', +'individuals', +'indoctrination', +'Ines Hipolito', +'Ines', +'inference', +'influence', +'information geometry', +'information', +'informational', +'interactions', +'interface', +'internal model', +'internal representation', +'internal states', +'interoception', +'interoceptive', 
+'interpretation', +'inverse model', +'Isomura', +'Jablonka', +'Jack Brookes', +'Jakob Hohwy', +'Jakub Limanowski', +'Jakub Smekal', +'Jakub', +'James C Harris', +'James Cooke', +'James E Cooke', +'James E Swain', +'James Fallon', +'James H Fallon', +'James Harris', +'James Swain', +'James Whittington', +'Tolman Eichenbaum Machine', +'Javier Sanchez Canizares', +'Jean Decety', +'Jelle Bruineberg', +'Jelle', +'Jiyoung Kang', +'Johannes Lohmann', +'John Doherty', +'John O Doherty', +'Jonathan P Roiser', +'Jonathan Roiser', +'Judea Pearl', +'Jun Tani', +'Justyna Ekert', +'Justyna O Ekert', +'Kai Ueltzhoffer', +'Kant', +'Kappel', +'Karl Friston', +'Karl J Friston', +'Karl', +'Katherine L Rosenblum', +'Katherine Rosenblum', +'Khezri', +'Kilner', +'Kirchhoff', +'Klaas E Stephan', +'Klaas Stephan', +'Kuchling', +'Kuhn', +'Laje', +'Lamme', +'Lancelot Costa', +'Lancelot Da Costa', +'Lancelot', +'language', +'Lars Muckli', +'Laurence J Kirmayer', +'Laurence Kirmayer', +'Laurent Perrinet', +'learning', +'least action', +'least', +'leave it to', +'leave to', +'left it to', +'left to', +'Leipzig', +'levels', +'Lieke de Boer', +'Lilian A E Weber', +'linguistics department', +'Linsker', +'Lisa Barrett', +'Lisa Feldman Barrett', +'living system', +'local', +'Lorenzo Niero', +'loss function', +'Lyapunov', +'M Berk Mirza', +'M Mirza', +'macaque', +'Maell Cullen', +'Mahault Albarracin', +'Majid Beni', +'Majid D Beni', +'Majid', +'Mangor Pedersen', +'Manuel Baltieri', +'Marc Tittgemeyer', +'Marcello Costantini', +'Maria Muzik', +'Mark Mon Williams', +'Mark Solms', +'Mark Williams', +'Markov blanket', +'Markov decision process', +'Markov', +'Marolla', +'Marta Gandolla', +'Martin Biehl', +'Martin Butz', +'Martin V Butz', +'Martin Voss', +'match.com', +'material', +'maths', +'MATLAB', +'Matthew M Nour', +'Matthew Nour', +'Mattia Veronese', +'Max Planck', +'Maxwell J D Ramstead', +'Maxwell Ramstead', +'maze', +'measurement noise', +'measurement', +'membrane', +'mesoanatomical', +'metacognition', +'Micah Allen', +'Michael Kirchhoff', +'Michael Levin', +'Michael Moutoussis', +'Michael Weisberg', +'Michael', +'Mike Levin', +'Milledge', +'mind', +'minimization', +'minimizing', +'model based', +'model selection', +'model', +'modelers', +'modularity', +'Moser', +'multimodal expansion', +'multimodal', +'multiple', +'narrative', +'Nathaniel Nyema', +'neoplasia', +'neuroimaging', +'neuromodulator', +'niche', +'Nick S Ward', +'Nick Ward', +'noise', +'nonclassical', +'Noor Sajid', +'novelty', +'numbers', +'objective function', +'observation', +'Oliver D Howes', +'Oliver Howes', +'Olivier Sigaud', +'Omar Khachouf', +'Omar T Khachouf', +'online', +'ontology', +'operating point', +'operations', +'order', +'OrgStream', +'overload', +'overridable', +'Ozan Catal', +'parse', +'partial', +'participants', +'particle', +'Pasco Fearon', +'Patrice Duquette', +'Patrick Connolly', +'Paul B Badcock', +'Paul Badcock', +'Paul Fletcher', +'Peirce', +'perception', +'performance', +'perspective', +'perturbation', +'Peter Bossaerts', +'Peter Culmer', +'Peter Uhlhaas', +'Peter Vincent', +'Pezzulo', +'phase', +'Philipp Schwartenbeck', +'Philipp Sterzer', +'philosophy', +'phyletic gradualism', +'physics', +'physiological', +'Piaget', +'plant', +'plasticity', +'play', +'policy selection', +'policy', +'polyethism', +'POMDP', +'position', +'possibility', +'posterior', +'pragmatic value', +'pragmatics', +'pragmatism', +'prediction error', +'prediction', +'Predictive Coding', +'predictive processing', +'predictive regulation', +'Predrag Petrovic', 
+'preference', +'principle', +'prior', +'probabilistic graphical model', +'process noise', +'process theory', +'processes', +'processing', +'professional setting', +'program', +'prompting', +'punctuated equilibrium', +'pymdp', +'conor', +'quantum', +'question', +'questions', +'Quigley', +'radical enactivist', +'Rao and Ballard', +'Raphael Kaplan', +'Raymond Dolan', +'Raymond J Dolan', +'reafferent', +'reality', +'realize', +'recognition model', +'recognition', +'reference distribution', +'reference trajectory', +'reflective', +'refrigerator', +'regime of attention', +'regulated resource', +'relationships', +'representation', +'representational', +'representationalism', +'representations', +'response curve', +'Richard E Rosch', +'Richard M Wilkie', +'Richard Rosch', +'Richard Wilkie', +'Rick A Adams', +'Rick Adams', +'Riemann', +'Robin Carhart Harris', +'Robin Harris', +'role', +'Rosalyn J Moran', +'Rosalyn Moran', +'Ross', +'Roy de Kleijn', +'Roy Kleijn', +'rules', +'Rutger Goekoop', +'Ryan Smith', +'Ryota Kanai', +'S Ho', +'S Shaun Ho', +'Saee Paliwal', +'salience', +'Samarth Swarup', +'Samuel P L Veissiere', +'Samuel Veissiere', +'Sandra Iglesias', +'saturation value', +'scale', +'scenario', +'science', +'section', +'selection', +'Sennesh', +'sense states', +'Sepideh Sadaghiani', +'set point', +'set', +'settling point', +'settling range', +'Shaun Gallagher', +'Shaun Ho', +'Shimazaki', +'Sillett', +'Simon C Smith', +'Simon Smith', +'solenoidal ', +'SPM', +'stability', +'state estimate', +'state space', +'state', +'states', +'stationarity', +'Stefan J Kiebel', +'Stefan Kiebel', +'Stefano Poletti', +'Stephen Fleming', +'Stephen Fox', +'Stephen Lawrie', +'Stephen M Fleming', +'Stephen M Lawrie', +'Stephen Mann', +'Stephen', +'Sterling Street', +'stigmergy', +'stimuli', +'stochastic optimal control', +'stock', +'story', +'structure', +'structures', +'Sukhi Shergill', +'surface', +'surprise', +'surround', +'Sussillo', +'switch', +'synaptic', +'system', +'Takazumi Matsumoto', +'Takuya Isomura', +'Takuya', +'Tarik Dahoun', +'Taylor Series', +'Taylor', +'teacher', +'teaching', +'teleology', +'temporal depth', +'theorem', +'theory', +'Theriault', +'thermodynamics of the brain', +'thermodynamics', +'Thomas Goschke', +'Thomas H B FitzGerald', +'Thomas Hope', +'Thomas M Hope', +'Thomas Parr', +'thought', +'threshold value', +'Tim Gard', +'Tim Verbelen', +'Tim Verbelen', +'time scales', +'Timothy Behrens', +'Tobias Nolte', +'Toon Van de Maele', +'top down', +'topic', +'Torigoe', +'Toronto', +'transfer function', +'transfer', +'transition', +'truth', +'Turrigiano', +'uncertainty', +'understanding', +'University of Surrey', +'value function', +'variable', +'variational free energy', +'variational', +'vehicles', +'Veissiere', +'viscerosensory signaling', +'viscerosensory', +'vision', +'Vivien Ainley', +'Wael Deredy', +'Wael El Deredy', +'wayfinding', +'Yoshio Nakamura', +'Zador', +'zebra', +'Zhang', +'Zina M Manjaly', +'Zina Manjaly' ], + "custom_spelling": [ {'from': ['actinf'], 'to': 'ActInf'}, +{'from': ['actinflab'], 'to': 'ActInfLab'}, +{'from': ['attial'], 'to': 'Attial'}, +{'from': ['ballard'], 'to': 'Ballard'}, +{'from': ['bayesian'], 'to': 'Bayesian'}, +{'from': ['bellman'], 'to': 'Bellman'}, +{'from': ['Benny','beni'], 'to': 'Beni'}, +{'from': ['beren','beran'], 'to': 'Beren'}, +{'from': ['millage','milledge'], 'to': 'Milledge'}, +{'from': ['anil'], 'to': 'Anil'}, +{'from': ['benucci'], 'to': 'Benucci'}, +{'from': ['Bijan'], 'to': 'Bijan'}, +{'from': ['bitcoin'], 'to': 'Bitcoin'}, +{'from': 
['blei'], 'to': 'Blei'}, +{'from': ['bleu','Blue'], 'to': 'Bleu'}, +{'from': ['botvinick'], 'to': 'Botvinick'}, +{'from': ['brea'], 'to': 'Brea'}, +{'from': ['bull'], 'to': 'Bull'}, +{'from': ['buzsaki'], 'to': 'Buzsaki'}, +{'from': ['canada'], 'to': 'Canada'}, +{'from': ['carnap'], 'to': 'Carnap'}, +{'from': ['clopath'], 'to': 'Clopath'}, +{'from': ['coda'], 'to': 'Coda'}, +{'from': ['daphne','dakki'], 'to': 'Daphne'}, +{'from': ['conor','connor'], 'to': 'Conor'}, +{'from': ['demekas'], 'to': 'Demekas'}, +{'from': ['conway'], 'to': 'Conway'}, +{'from': ['costa'], 'to': 'Costa'}, +{'from': ['covid'], 'to': 'COVID'}, +{'from': ['dag'], 'to': 'DAG'}, +{'from': ['dags'], 'to': 'DAGs'}, +{'from': ['daniel'], 'to': 'Daniel'}, +{'from': ['dauwels'], 'to': 'Dauwels'}, +{'from': ['dayan'], 'to': 'Dayan'}, +{'from': ['dcm'], 'to': 'DCM'}, +{'from': ['dean'], 'to': 'Dean'}, +{'from': ['deneve'], 'to': 'Deneve'}, +{'from': ['dennett'], 'to': 'Dennett'}, +{'from': ['dirichlet'], 'to': 'Dirichlet'}, +{'from': ['dutch'], 'to': 'Dutch'}, +{'from': ['edelman'], 'to': 'Edelman'}, +{'from': ['english'], 'to': 'English'}, +{'from': ['feynman'], 'to': 'Feynman'}, +{'from': ['fmri'], 'to': 'fMRI'}, +{'from': ['Calfistan','fristen','friston','Tristan'], 'to': 'Friston'}, +{'from': ['harrison'], 'to': 'Harrison'}, +{'from': ['hebbian'], 'to': 'Hebbian'}, +{'from': ['hinds','hines'], 'to': 'Heins'}, +{'from': ['helmholtz'], 'to': 'Helmholtz'}, +{'from': ['hideaki'], 'to': 'Hideaki'}, +{'from': ['hinton'], 'to': 'Hinton'}, +{'from': ['hipolito'], 'to': 'Hipolito'}, +{'from': ['Howe','hohwy'], 'to': 'Hohwy'}, +{'from': ['brennan'], 'to': 'Brennan'}, +{'from': ['Chance'], 'to': 'Tschantz'}, +{'from': ['Ian'], 'to': 'Iain'}, +{'from': ['Cousin'], 'to': 'Couzin'}, +{'from': ['ines','Innes','inez'], 'to': 'Ines'}, +{'from': ['isomura'], 'to': 'Isomura'}, +{'from': ['jablonka'], 'to': 'Jablonka'}, +{'from': ['jelle'], 'to': 'Jelle'}, +{'from': ['kappel'], 'to': 'Kappel'}, +{'from': ['carl','Calf'], 'to': 'Karl'}, +{'from': ['Khezri'], 'to': 'Khezri'}, +{'from': ['kilner'], 'to': 'Kilner'}, +{'from': ['kirchhoff'], 'to': 'Kirchhoff'}, +{'from': ['kuchling'], 'to': 'Kuchling'}, +{'from': ['kuhn'], 'to': 'Kuhn'}, +{'from': ['laje'], 'to': 'Laje'}, +{'from': ['lamme'], 'to': 'Lamme'}, +{'from': ['lancelot'], 'to': 'Lancelot'}, +{'from': ['leipzig'], 'to': 'Leipzig'}, +{'from': ['linsker'], 'to': 'Linsker'}, +{'from': ['lyapunov'], 'to': 'Lyapunov'}, +{'from': ['majid'], 'to': 'Majid'}, +{'from': ['markov','markoff'], 'to': 'Markov'}, +{'from': ['marolla'], 'to': 'Marolla'}, +{'from': ['matlab'], 'to': 'MATLAB'}, +{'from': ['michael'], 'to': 'Michael'}, +{'from': ['moser'], 'to': 'Moser'}, +{'from': ['orgstream'], 'to': 'OrgStream'}, +{'from': ['pezzulo'], 'to': 'Pezzulo'}, +{'from': ['piaget', 'PSJA'], 'to': 'Piaget'}, +{'from': ['plank','Pluck'], 'to': 'Planck'}, +{'from': ['pineapple'], 'to': 'pymdp'}, +{'from': ['pomdp'], 'to': 'POMDP'}, +{'from': ['quigley'], 'to': 'Quigley'}, +{'from': ['riemann'], 'to': 'Riemann'}, +{'from': ['ross'], 'to': 'Ross'}, +{'from': ['sennesh'], 'to': 'Sennesh'}, +{'from': ['shimazaki'], 'to': 'Shimazaki'}, +{'from': ['sillett'], 'to': 'Sillett'}, +{'from': ['spm'], 'to': 'SPM'}, +{'from': ['stephen'], 'to': 'Stephen'}, +{'from': ['sussillo'], 'to': 'Sussillo'}, +{'from': ['takuya'], 'to': 'Takuya'}, +{'from': ['taylor'], 'to': 'Taylor'}, +{'from': ['theriault'], 'to': 'Theriault'}, +{'from': ['tolman'], 'to': 'Tolman'}, +{'from': ['torigoe'], 'to': 'Torigoe'}, +{'from': ['toronto'], 'to': 
'Toronto'}, +{'from': ['turrigiano'], 'to': 'Turrigiano'}, +{'from': ['veissiere'], 'to': 'Veissiere'}, +{'from': ['zador'], 'to': 'Zador'}, +{'from': ['zhang'], 'to': 'Zhang'} ], + #"summarization": True, + #"summary_type": "bullets", + "speaker_labels": True, + "language_model": "medium", + "entity_detection": True, + "iab_categories": True, + "auto_chapters": True, + "sentiment_analysis": True, + "language_code": "en_us" +} +headers = {"authorization": "a14f484d11984e00bf7105cda4bc0c9a","content-type": "application/json"} +response = requests.post(endpoint, json=json, headers=headers) +#print(response.json()) +jj=response.json() +myId=jj.get('id') +print(myId) +myStatus=jj.get('status') +print(myStatus) +time.sleep(30) + + +import requests +import time +import sys +import math +import csv +#myId = "rsuh9skgre-a056-486e-8138-2e6608d21f04" + +while myStatus == "queued" or myStatus == "processing": + time.sleep(120) + endpoint = "https://api.assemblyai.com/v2/transcript/" + myId + headers = {"authorization": "a14f484d11984e00bf7105cda4bc0c9a"} + response = requests.get(endpoint, headers=headers) + #print(response.json()) + jj=response.json() + myStatus=jj.get('status') + print(myStatus) + + +print() +print() +print("Dump JSON response:") +print(jj) +print() +print(myId) +print(myStatus) + +if myStatus != "completed": + myError = jj.get('error') + print() + print("Bad results from last main poll. Call if you find work.") + print(myError) + quit() + +# ----------- words (apparently always identical to those from paragraphs) ---------- + + +wordFileName = docLabel + "_" + onlineFile + ".words.csv" +#wwf = open(wordFileName, "w") + +#words = jj.get('words') + +#for count, word in enumerate(words): +# wtext=word.get('text') +# wstart=word.get('start') +# wend=word.get('end') +# wconfid=word.get('confidence') +# wspeaker=word.get('speaker') +# # +# wordOut = str(wstart) + "\t" + str(wend) + "\t" +# if wspeaker != None: +# wordOut = wordOut + wspeaker +# +# # +# wordOut = wordOut + "\t" + str(wconfid) + "\t" +# if wtext != None: +# wordOut = wordOut + wtext +# +# # +# #wordOut = str(wstart) + "\t" + str(wend) + "\t" + wspeaker + "\t" + str(wconfid) + "\t" + wtext +# wwf.write(wordOut) # #print(utterOut) , delimiter='\t', lineterminator='\t\n' +# wwf.write("\r\n") + +#wwf.close() + + +# ----------- IAB categories ---------- + +iabCats = jj.get('iab_categories_result') +catStatus=iabCats.get('status') +if catStatus == 'success': + catDetFileName = docLabel + "_" + onlineFile + ".categoryDetails.csv" + cdf = open(catDetFileName, "w") + catDetOut = "start" + "\t" + "end" + "\t" + 'relevance' + "\t" + 'label' + cdf.write(catDetOut) + cdf.write("\r\n") + catDetails=iabCats.get('results') + for rCount, cDKey in enumerate(catDetails): # retrieve by POSITION + #for count, cKey in enumerate(cDKey): # retrieve by KEY + cTKey = cDKey.get('timestamp') + #print(cTKey) + cStart = cTKey.get('start') # will use same timestamps for all label/relevance pairs + #print(cStart) + cEnd = cTKey.get('end') + #print(cEnd) + cLabels = cDKey.get('labels') + #print(cLabels) + for labelCount, labelPair in enumerate(cLabels): # retrieve by POSITION + cRelev = labelPair.get('relevance') + cLabel = labelPair.get('label') + catDetOut = str(cStart) + "\t" + str(cEnd) + "\t" + str(cRelev) + "\t" + str(cLabel) + #print(catDetOut) + cdf.write(catDetOut) # print(utterOut) , delimiter='\t', lineterminator='\t\n' + cdf.write("\r\n") + + + cdf.close() + + +# also (separately) save summaries (i.e. 
session-level IAB categories)
+if catStatus == 'success':
+    catFileName = docLabel + "_" + onlineFile + ".categories.csv"
+    ccf = open(catFileName, "w")
+    catOut = "key" + "\t" + "relevance"
+    ccf.write(catOut)   # print(utterOut) , delimiter='\t', lineterminator='\t\n'
+    ccf.write("\r\n")
+    summaries = iabCats.get('summary')
+    summKeys = summaries.keys()
+    for count, cKey in enumerate(summKeys):
+        cRelev = summaries.get(cKey)
+        catOut = cKey + "\t" + str(cRelev)
+        ccf.write(catOut)   # print(utterOut) , delimiter='\t', lineterminator='\t\n'
+        ccf.write("\r\n")
+
+
+    ccf.close()
+
+
+# ----------- chapters ----------
+chapterVec = []
+chapterVecs = []
+chapFileName = docLabel + "_" + onlineFile + ".chapters.csv"
+ccf = open(chapFileName, "w")
+
+chapters = jj.get('chapters')   # also insert timestamp
+#write header
+chapterOut = "start" + "\t" + "end" + "\t" + "startTime" + "\t" + "summary" + "\t" + "headline" + "\t" + "gist"
+ccf.write(chapterOut)
+ccf.write("\r\n")
+
+for count, chapter in enumerate(chapters):
+    cSummary = chapter.get('summary')
+    cHeadline = chapter.get('headline')
+    cGist = chapter.get('gist')
+    cStart = chapter.get('start')
+    cStartTime = ToDisplayTime(cStart)   #supplement with legible timestamp
+    cEnd = chapter.get('end')
+    chapterOut = str(cStart) + "\t" + str(cEnd) + "\t" + str(cStartTime) + "\t" + cSummary + "\t" + cHeadline + "\t" + cGist
+    ccf.write(chapterOut)
+    ccf.write("\r\n")
+    chapterVec = [cStart, cEnd, cSummary, cHeadline, cGist]
+    chapterVecs.append(chapterVec)
+ccf.close()
+
+
+# ----------- sentiment analysis ----------
+
+ss = jj.get('sentiment_analysis_results')
+#print(ss)
+
+# Better to use CSV package throughout!
+#with open('records.tsv', 'w', newline='') as tsvfile:
+#    writer = csv.writer(tsvfile, delimiter='\t', lineterminator='\n')
+#    for record in SeqIO.parse("/home/fil/Desktop/420_2_03_074.fastq", "fastq"):
+#        writer.writerow([record.id, record.seq, record.format("qual")])
+
+sentimentFileName = docLabel + "_" + onlineFile + ".sentiments.csv"
+ssf = open(sentimentFileName, "w")
+
+sentimOut = "start" + "\t" + "end" + "\t" + "speaker" + "\t" + 'sentiment' + "\t" + "confidence" + "\t" + "text"
+ssf.write(sentimOut)   # print(sentimOut) , delimiter='\t', lineterminator='\t\n'
+ssf.write("\r\n")
+
+#with open(sentimentFileName, 'w', encoding='utf8', newline='') as csvfile:
+#    writer = csv.writer(csvfile, delimiter=',', lineterminator='\n')
+#    writer.writeheader(["start","end","speaker","sentiment","confidence","text"])
+#    #for record in SeqIO.parse("/home/fil/Desktop/420_2_03_074.fastq", "fastq"):
+#    writer.writerow([record.id, record.seq, record.format("qual")])
+
+for count, sentim in enumerate(ss):
+    stext = sentim.get('text')
+    sstart = sentim.get('start')
+    send = sentim.get('end')
+    ssentim = sentim.get('sentiment')
+    sconfid = sentim.get('confidence')
+    sspeaker = sentim.get('speaker')
+    sentimOut = str(sstart) + "\t" + str(send) + "\t"
+    if sspeaker != None:
+        sentimOut = sentimOut + sspeaker
+
+    #
+    sentimOut = sentimOut + "\t" + str(ssentim) + "\t" + str(sconfid) + "\t" + stext   # sentiment column included, matching the header
+    ssf.write(sentimOut)   # print(sentimOut) , delimiter='\t', lineterminator='\t\n'
+    ssf.write("\r\n")
+
+ssf.close()
+
+# ----------- utterances ----------
+
+utteranceFileName = docLabel + "_" + onlineFile + ".utterances.csv"
+uuf = open(utteranceFileName, "w")
+
+utterOut = "start" + "\t" + "end" + "\t" + "speaker" + "\t" + "confidence" + "\t" + "text"
+uuf.write(utterOut) # print(utterOut) , 
delimiter='\t', lineterminator='\t\n' +uuf.write("\r\n") + +utterances = jj.get('utterances') + +for count, utterance in enumerate(utterances): + uconfid = utterance.get('confidence') + uend = utterance.get('end') + uspeaker = utterance.get('speaker') + ustart = utterance.get('start') + utext = utterance.get('text') + #utterOut = str(ustart) + "\t" + str(uend) + "\t" + uspeaker + "\t" + str(uconfid) + "\t" + utext + utterOut = str(ustart) + "\t" + str(uend) + "\t" + if uspeaker != None: + utterOut = utterOut + uspeaker + + # + utterOut = utterOut + "\t" + str(uconfid) + "\t" + utext + uuf.write(utterOut) # print(utterOut) , delimiter='\t', lineterminator='\t\n' + uuf.write("\r\n") + +uuf.close() + + +# ----------- entities ---------- + +entityFileName = docLabel + "_" + onlineFile + ".entities.csv" +eef = open(entityFileName, "w") + +entityOut = "text" + "\t" + 'entity_type' + "\t" + "\t" + "start" + "\t" + "end" +eef.write(entityOut) +eef.write("\r\n") + +entities = jj.get('entities') +for count, entity in enumerate(entities): + eType=entity.get('entity_type') + eText=entity.get('text') + eStart=entity.get('start') + eEnd=entity.get('end') + entityOut = eText + "\t" + eType + "\t" + "\t" + str(eStart) + "\t" + str(eEnd) + eef.write(entityOut) + eef.write("\r\n") + + +eef.close() + + +#------- paragraphs ------------------- + + +#needs myId, docLabel, onlineFile +#myId ="rsuh9skgre-a056-486e-8138-2e6608d21f04" +#docLabel = "mo007-1-SP" +#onlineFile = "mo007-1." + +import requests +import time +import sys +import math +import csv + +endpoint = "https://api.assemblyai.com/v2/transcript/" + myId + "/paragraphs" +headers = {"authorization": "a14f484d11984e00bf7105cda4bc0c9a"} +response = requests.get(endpoint, headers=headers) +time.sleep(60) +kk=response.json() +print("") +print("") +print(" *** Response from /paragraphs call ***") +print(kk) +print("") +print(" *************************************") +print("") + +parags=kk.get("paragraphs") #fetch all paragraphs +paragCount = len(parags) #how many paragraphs? +#print(paragCount) +paragNum = 0 +wordPos = 0 + +paragraphFileName = docLabel + "_" + onlineFile + ".paragraphs.csv" +ppf = open(paragraphFileName, "w") + +current_speaker = "(Undefined Speaker)" +paragSpeakers = dict() + +paragSpeakerFileName = docLabel + "_" + onlineFile + ".paragSpeakers.csv" +psf = open(paragSpeakerFileName, "w") + + +paragStartings = [] +rawParags = {} +speakerCount = 0 +speakerTurns = 0 +oldWEnd = 0 # end of preceding word; matches current_speaker +# needed to end preceding paragraph when change of speaker triggers end-of-paragraph event + +#Also record PARAGRAPH version of words: Speaker can VARY within paragraph! # also insert timestamp, "Corrected Text". 
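+# (A small sketch, not wired in: the None-guarded, tab-joined row building that
+# repeats below for words, paragraphs, sentences, and utterances could be factored
+# into a helper along these lines.)
+#def tsv_row(*fields):
+#    return "\t".join("" if f is None else str(f) for f in fields)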
+paragWordFileName = docLabel + "_" + onlineFile + ".paragWords.csv" +pwf = open(paragWordFileName, "w") +wordOut = "start" + "\t" + "end" + "\t" + "speaker" + "\t" + "confidence" + "\t" + "paragWordPos" + "\t" + "wordPos" + "\t" + "text" +pwf.write(wordOut) +pwf.write("\r\n") + +#Column headers +paragOut = "start" + "\t" + "end" + "\t" + "paragNum" + "\t" + "speaker" + "\t" + "confidence" + "\t" + "startTime" + "\t" + "wordCount" + "\t" + "text" +ppf.write(paragOut) +ppf.write("\r\n") + +#if docLabel in paragSpeakers: # re-run; delete old slot +# paragSpeakers[docLabel] = { } +# print() + +for p0 in parags: + paragNum += 1 + paragWordPos = 0 # count of words within paragraph + text=p0.get('text') #text of paragraph + start=p0.get('start') #starting milisecond of paragraph + paragStartings.append(start) + pStartTime = ToDisplayTime(start) # supplement with legible timestamp + end=p0.get('end') #text of paragraph + pconfid = p0.get('confidence') #paragraph-level confidence + words=p0.get('words') #list of words + wordCount = len(words) + w1_0=words[0] #first word - use only "speaker" of first word + sp=w1_0.get('speaker') #Label entire paragraph with first speaker + + # Record start of each speech turn (usually several per speaker) + if sp != current_speaker: + current_speaker = sp + speakerTurns += 1 + if sp in paragSpeakers: + paragSpeakers[sp].append(start) + else: + paragSpeakers[sp] = [start] # First speech turn only + speakerCount += 1 + # + # + paragFirstWordCount = wordPos + 1 #position within document, of first word in paragraph + + for wCount, word in enumerate(words): # Now extract all info on included words + wordPos += 1 #position of word within document + paragWordPos += 1 #position of word within paragraph + wtext=word.get('text') + wstart=word.get('start') + wend=word.get('end') + wconfid=word.get('confidence') + wspeaker=word.get('speaker') + #wordOut = str(wstart) + "\t" + str(wend) + "\t" + wspeaker + "\t" + str(wconfid) + "\t" + wtext + wordOut = str(wstart) + "\t" + str(wend) + "\t" + if wspeaker != None and len(wspeaker)>0: + wordOut += wspeaker + + wordOut += "\t" + str(wconfid) + "\t" + str(paragWordPos) + "\t" + str(wordPos) + "\t" + wtext + pwf.write(wordOut) # print(utterOut) , delimiter='\t', lineterminator='\t\n' + pwf.write("\r\n") + # + paragLastWordCount = wordPos # count of most recently-counted word within document, is last word in paragraph + + paragOut = str(start) + "\t" + str(end) + "\t" + str(paragNum) + "\t" + if sp != None and len(sp) > 0: + paragOut += sp + # + paragOut += "\t" + str(pconfid) + paragOut += "\t" + str(pStartTime) + + paragOut += "\t" + str(wordCount) + paragOut += "\t" + text # '+ "\t" + text' for manual editing. IF you use a spreadsheet, REMEMBER to set the "text" columns very wide before saving!! 
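+    # (Note: the companion script 2_sentencesToTranscripts.py reads an optional
+    # "Corrected Text" column back from the manually edited copy of this CSV and
+    # prefers it over the raw "text" column, so fixes can live alongside the original.)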
+ ppf.write(paragOut) + ppf.write("\r\n") + + # parag start/end millisecond, parag #, first speaker, confid, # words in parag, (document-level) start/last word # + rawParags.update( {start: [end, paragNum, sp, pconfid, wordPos, paragWordPos, paragFirstWordCount, paragLastWordCount] } ) + #rawParags.update( {start: {'end':wend, 'paragNum':paragNum, 'speaker':wspeaker, 'confid':wconfid, 'wordPos':wordPos, 'paragFirstWordCount':paragFirstWordCount} } ) + +#display first occurrence of each speaker, with first time (in three formats) +#print("paragSpeakers:") +#print(paragSpeakers) +#{'A': [1200, 3000], 'B': [2400]} + +speakerTimeOut = 'docLabel' + "\t" + "sp" + "\t" + "myTime" + "\t" + "myTimeDisplay" + "\t" + "myTimeSRT" +psf.write(speakerTimeOut) +psf.write("\r\n") + +paragSpeakerKeys=paragSpeakers.keys() +for sp in paragSpeakerKeys: + timeList = paragSpeakers.get(sp) + for tcc, myTime in enumerate(timeList): + #paragSpeakers[docLabel] = {start: sp} + speakerTimeOut = docLabel + "\t" + sp + "\t" + str(myTime) + "\t" + ToDisplayTime(myTime) + "\t" + ToSRTTime(myTime) + psf.write(speakerTimeOut) + psf.write("\r\n") + # + +# +ppf.close() +pwf.close() +psf.close() + +print(" Speakers (from Paragraphs output):") +print(paragSpeakerKeys) +for sp in paragSpeakerKeys: + timeList = paragSpeakers.get(sp) + print(sp + " @ " + ToDisplayTime(timeList[0])) + +#--------- Sentence(s) ----------------- + +#myId="rs8dx3ybuk-75db-405d-950b-560ec269d003" + +endpoint = "https://api.assemblyai.com/v2/transcript/" + myId + "/sentences" +headers = { + "authorization": "a14f484d11984e00bf7105cda4bc0c9a"} +sResponse = requests.get(endpoint, headers=headers) +time.sleep(30) +sss=sResponse.json() +myStatus=sss.get('status') +print(myStatus) +print("") +print("") +print(" *** Response from /sentences call ***") +print(sss) +print("") +print(" *************************************") +print("") + +paragTimes = [] +paragTimes = rawParags.keys() # Key (i.e. paragraph-start time) may be all we need hereafter + +current_speaker = "(Undefined Speaker)" +wordPos = 0 # starting thru document from top + +sents=sss.get("sentences") #fetch all sentences +sentCount = len(sents) #how many sentences? 
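+# (For reference below: each rawParags entry maps a paragraph's start time to
+# [end, paragNum, speaker, confidence, wordPos, paragWordPos, paragFirstWordCount,
+# paragLastWordCount], so index 1 is the paragraph number.)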
+sentNum = 0
+
+sentenceFileName = docLabel + "_" + onlineFile + ".sentences.csv"
+sssf = open(sentenceFileName, "w")
+#Column headers
+sentOut = "start" + "\t" + "end" + "\t" + "sentNum" + "\t" + "speaker" + "\t" + "confidence" + "\t" + "text"
+sssf.write(sentOut)
+sssf.write("\r\n")
+
+sentWordFileName = docLabel + "_" + onlineFile + ".sentWords.csv"
+sswf = open(sentWordFileName, "w")
+sentWOut = "start" + "\t" + "end" + "\t" + "sentNum" + "\t" + "speaker" + "\t" + "confidence" + "\t" + "wordPosSent" + "\t" + "wordPosDoc" + "\t" + "text"
+sswf.write(sentWOut)
+sswf.write("\r\n")
+
+for s0 in sents:
+    sentNum += 1
+    sentWordPos = 0                   # no words yet seen in this sentence
+    text = s0.get('text')             #text of sentence
+    start = s0.get('start')           #starting millisecond of sentence
+    end = s0.get('end')               #ending millisecond of sentence
+    pconfid = s0.get('confidence')    #sentence-level confidence
+    w1 = s0.get('words')              #list of words
+    w1_0 = w1[0]                      #first word - use only "speaker" of first word
+    sp = w1_0.get('speaker')          #Label entire sentence with first speaker
+    #
+    if start in paragTimes:           # this sentence opens one of the paragraphs recorded above
+        paragBreak = True
+        paragNum = rawParags[start][1]   # index 1 of the rawParags entry is the paragraph number
+    else:
+        paragBreak = False
+        paragNum = 0
+    #
+    for wCount, word in enumerate(w1):   # Now extract all info on included words
+        wordPos += 1         #position of word within document
+        sentWordPos += 1     #position of word within sentence
+        wtext = word.get('text')
+        wstart = word.get('start')
+        wend = word.get('end')
+        wconfid = word.get('confidence')
+        wspeaker = word.get('speaker')
+        #sentenceWords = [wstart, wend, sentNum, wspeaker, wconfid, sentWordPos, wordPos, wtext]
+        #wordOut = str(wstart) + "\t" + str(wend) + "\t" + wspeaker + "\t" + str(wconfid) + "\t" + wtext
+        wordOut = str(wstart) + "\t" + str(wend) + "\t" + str(sentNum) + "\t"
+        if wspeaker != None and len(wspeaker) > 0:
+            wordOut += wspeaker
+        #
+        if paragNum > 0:
+            wordOut += str(paragNum)   # paragraph-opening sentences carry their paragraph number after the speaker label
+        #
+        wordOut += "\t" + str(wconfid) + "\t" + str(sentWordPos) + "\t" + str(wordPos) + "\t" + wtext
+        sswf.write(wordOut)
+        sswf.write("\r\n")
+    # sentOut = str(start) + "\t" + str(end) + "\t" + sp + "\t" + str(pconfid) + "\t" + text
+    sentOut = str(start) + "\t" + str(end) + "\t" + str(sentNum) + "\t"
+    if sp != None:   # 'sentence-level speaker.' Don't rely on this at word level.
+        sentOut += sp
+    #
+    sentOut += "\t" + str(pconfid) + "\t" + text
+    sssf.write(sentOut)
+    sssf.write("\r\n")
+    #
+    if (sp != current_speaker) or (start in paragStartings):
+        print("Magic new paragraph, speaker '" + str(wspeaker) + "' at " + str(wstart))
+    #
+
+sssf.close()
+sswf.close()
+
+
+# ------------ SRT -----------
+
+import requests
+import time
+import sys
+import math
+import csv
+
+#docLabel = "parseSRT"
+#onlineFile = "ls040-0"
+
+srtFileName = docLabel + "_" + onlineFile + ".srt"
+srtf = open(srtFileName, "w")
+
+#myId="rsfzjbpypn-f1ff-4dc4-9aca-0526544dc4ed"
+
+endpoint = "https://api.assemblyai.com/v2/transcript/" + myId + "/srt?chars_per_caption=40"   # "/srt?chars_per_caption=40" "/paragraphs"
+headers = {"authorization": "a14f484d11984e00bf7105cda4bc0c9a"}
+sResponse = requests.get(endpoint, headers=headers)
+
+srtf.write(sResponse.text)
+srtf.write("\r\n")
+
+srtf.close()
+
+#time.sleep(30)
+#srts=sResponse.json()
+#print(srts)
+#myStatus=srts.get('status')
+#print(myStatus)
+
+
+#srtOut = srtOut + "\t" + str(pconfid) + "\t" + text
+#srtf.write(srtOut)
+
+print("Thanks for the call!")
+quit()
diff --git a/Scripts/2_sentencesToTranscripts.py b/Scripts/2_sentencesToTranscripts.py
new file mode 100644
index 0000000..5cf1150
--- /dev/null
+++ b/Scripts/2_sentencesToTranscripts.py
@@ -0,0 +1,680 @@
+
+#cd "/mnt/d/Documents/FEP-AI/2022 ModelStream/mo007/SPtest"
+# python3 "/mnt/d/Documents/FEP-AI/Active Inference Podcast/sentencesToTranscripts.py" mo007-1 "." "mo007-1_mo007-1.mp3.sentences.csv" | tee mo007-1_publish.txt
+
+#AllSpeakers "/mnt/d/Documents/FEP-AI/Active Inference Podcast/AllSpeakers.csv"
+
+import csv
+import time
+import sys
+import math
+import json
+from html.parser import HTMLParser
+
+if __name__ == "__main__":
+    print(f"Arguments count: {len(sys.argv)}")
+    if len(sys.argv) == 1:
+        print("sentencesToTranscripts. Needs parameters docLabel (key that binds references to this doc),")
+        print("inSentDir (path to incoming files), inSentFile (name of driver file *.sentences.csv).")
+        print("Optional params outDir (defaults to working directory '.'), speakers (defaults to a central CSV identifying all speakers).")
+        print("Created in outDir: *_paragTranscript.txt and *_transcript.txt.")
+        print("If inSentDir holds a *.paragraphs.csv file, it's used to force paragraph ends.")
+        quit()
+    elif len(sys.argv) < 4:
+        print("Need at least docLabel, inSentDir, and inSentFile; optional outDir, speakers. Exiting!")
+        quit()
+
+#File references:
+#    inSentDir/inSentFile     Driver
+#    inSpeakerDir/inSpeakers  When mappings known
+#    [inSentDir]/inWords      Improves timestamp splitting; optional
+#    outDir/                  One destination for everything
+#Parameters:
+#    MaxChars                 For SRT: Max line len in chars
+
+#outDir = "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #035 A tale of Two architectures/ls035-0/publish"
+
+inSpeakerDir = "/mnt/d/Documents/FEP-AI/Active Inference Podcast/"
+inSpeakers = "AllSpeakers.csv"
+
+docLabel = sys.argv[1]
+inSentDir = sys.argv[2]
+inSentFile = sys.argv[3]
+print("docLabel, inSentDir, inSentFile " + "'" + docLabel + "', '" + inSentDir + "', '" + inSentFile + "'")
+
+#inSentDir = "/mnt/d/Documents/2022 Org Streams/os003/"
+inParagFile = inSentFile.replace('.sentences.', '.paragraphs.')
+
+if len(sys.argv) > 4:
+    outDir = sys.argv[4]
+else:
+    outDir = "."   #publish to working directory!
+
+print("outDir: " + "'" + outDir + "'")
+
+if len(sys.argv) > 5:
+    speakerFile = sys.argv[5]
+else:
+    speakerFile = "/mnt/d/Documents/FEP-AI/Active Inference Podcast/AllSpeakers.csv"
+
+print('speakers File: ' + "'" + speakerFile + "'")   # (currently informational only; the path actually opened is built from inSpeakerDir + inSpeakers below)
+
+# globals
+speakerDesc = {}
+
+# ++++++ notes ++++++
+
+#prepare to compare to Google/YouTube word list
+#confidSentWordList = sentWordVec
+#confidSentWordList.sort(reverse=True, key = lambda x: x[3])   # descending by confidence
+#print(confidSentWordList)
+
+#where the fourth component of sentenceWords is confidence, the following gives the highest-confidence words at the top:
+#sentenceWords.sort(reverse=True, key = lambda x: x[3])
+
+# "Correct Whisper per YouTube (ls038-2).ods"
+
+
+# ----- notes -----
+
+
+
+# ------- Utility functions --------------
+
+def hhMmSsToTime(ts):
+    # Parse "hh:mm:ss", "h:mm:ss", "mm:ss", or "m:ss" into milliseconds.
+    tsLen = len(ts)
+    print("in hhMmSsToTime; ts/tsLen:")
+    print(ts)
+    print(tsLen)
+    if tsLen == 8:     # hh:mm:ss
+        hh = int(ts[0:2])
+        mm = int(ts[3:5])
+        ss = int(ts[6:8])
+        to_time = 3600000*hh + 60000*mm + 1000*ss
+        return to_time
+    elif tsLen == 7:   # h:mm:ss
+        hh = int(ts[0:1])
+        mm = int(ts[2:4])
+        ss = int(ts[5:7])
+        to_time = 3600000*hh + 60000*mm + 1000*ss
+        return to_time
+    elif tsLen == 5:   # mm:ss
+        mm = int(ts[0:2])
+        ss = int(ts[3:5])
+        to_time = 60000*mm + 1000*ss
+        return to_time
+    elif tsLen == 4:   # m:ss
+        mm = int(ts[0:1])
+        ss = int(ts[2:4])
+        to_time = 60000*mm + 1000*ss
+        return to_time
+    else:
+        return 9999999
+    #
+#
+
+
+
+def ToDisplayTime(tt):
+    # Convert a millisecond count to a human-readable "[h:]mm:ss" timestamp.
+    ts = float(0.0+int(tt))
+    h0 = int(ts/3600000.0)
+    hh = ""
+    if h0 > 9:
+        hh = str(100+h0)
+        hh = hh[1:3] + ":"
+    elif h0 > 0:
+        hh = str(h0) + ":"
+
+    m0 = int( (ts-(3600000.0*h0))/60000.0)
+    mm = str(100+m0)
+    s0 = int( (ts - (3600000.0*h0) - (60000.0*m0) ) /1000.0)
+    ss = str(100+s0)
+    to_time = hh + mm[1:3] + ":" + ss[1:3]
+    return to_time
+
+
+#j=ToDisplayTime(64968112)
+#print(j)
+#j = ToDisplayTime(4968112)
+#print(j)
+#j = ToDisplayTime(70337)
+#print(j)
+#j = ToDisplayTime(2337)
+#print(j)
+
+
+def ToSRTTime(tt):
+    # Convert a millisecond count to an SRT-style "hh:mm:ss,mmm" timestamp.
+    ts = float(0.0+int(tt))
+    h0 = int(ts/3600000.0)
+    hh = str(100+h0)
+    m0 = int( (ts-(3600000.0*h0))/60000.0)
+    mm = str(100+m0)
+    s0 = int( (ts - (3600000.0*h0) - (60000.0*m0) ) /1000.0)
+    ss = str(100+s0)
+    mms0 = int(ts - (3600000.0*h0) - (60000.0*m0) - (1000.0*s0))
+    mms = str(1000+mms0)
+    to_time = hh[1:3] + ":" + mm[1:3] + ":" + ss[1:3] + "," + mms[1:4]
+    return to_time
+
+#j=ToSRTTime(64968112)
+#print(j)
+#j = ToSRTTime(4968112)
+#print(j)
+#j = ToSRTTime(70337)
+#print(j)
+#j = ToSRTTime(2337)
+#print(j)
+
+def secToTime(ms):
+    # Despite the historical name, the argument is a millisecond count;
+    # returns "mm:ss,mmm", or "hh:mm:ss,mmm" for values of an hour or more.
+    if ms >= 3600000:
+        h0 = int(ms/3600000.0)
+        hh = str(100+h0)
+        m0 = int( (ms-(3600000.0*h0))/60000.0)
+        mm = str(100+m0)
+        s0 = int( (ms - (3600000.0*h0) - (60000.0*m0) ) /1000.0)
+        ss = str(100+s0)
+        mms0 = int(ms - (3600000.0*h0) - (60000.0*m0) - (1000.0*s0))
+        mms = str(1000+mms0)
+        to_time = hh[1:3] + ":" + mm[1:3] + ":" + ss[1:3] + "," + mms[1:4]
+        return to_time
+    else:
+        m0 = int( ms / 60000.0)
+        mm = str(100+m0)
+        s0 = int( (ms - (60000.0*m0) ) /1000.0)
+        ss = str(100+s0)
+        mms0 = int(ms - (60000.0*m0) - (1000.0*s0))
+        mms = str(1000+mms0)
+        to_time = mm[1:3] + ":" + ss[1:3] + "," + mms[1:4]
+        return to_time
+    #
+#
+
+
+
+
+# ------- "Business" functions --------------
+
+def speakerIdToName(doc, id, myTime):
+# Default; override if possible from inSpeakers
+    #print("ord, len of '" + id)
+    #print(ord(id))
+    #print(len(id))
+    if len(id) > 1:   # speaker already spelled out in 'sentences' input
+        return id
+    #
+    speaker = "Speaker " + id   # default
+    #print("speakerDesc")
+    #print(speakerDesc)
+    spDesc = speakerDesc.get(id)
+    #print("spDesc")
+
#print(spDesc) + if spDesc is not None: + dName = spDesc.get('displayedName') + #print("dName") + #print(dName) + if dName is not None and len(dName)>0: + speaker = dName + # + # + return speaker + # +# + + + +# ---------------- MAIN ----------------- + +#outDir = "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #035 A tale of Two architectures/ls035-1/publish" + +inSpeakerDir = "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #040 - Chris Fields... A free energy principle for generic quantum systems/ls040-1_noSpeaker" +inSpeakers = "noSpeaker_ls040-0.Speakers.csv" +inSpeakerDir = "/mnt/d/Documents/FEP-AI/Active Inference Podcast" +inSpeakers = "AllSpeakers.csv" + + +#inSentDir = "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #040 - Chris Fields... A free energy principle for generic quantum systems/ls040-1_noSpeaker" +#inSentFile = "ls036-0_ls036-0.m4a.paragraphs.csv" +#inSentDir = "/mnt/d/Documents/FEP-AI/2022 Livestreams/ActInf Livestream #036 Modeling Ourselves/ls036-0" +#inSentFile = "ls036-0_ls036-0.m4a.paragraphs.csv" +#inSentDir = "/mnt/d/Documents/FEP-AI/2022 Org Streams/os003" +#inSentFile = "Bijan_os003-1.m4a.paragraphs.csv" + + + +#CSV column headers: +# paragraph: start, end, speaker, confid, text +# speakers: VideoLabel, SpeakerLabel, DisplayedSpeakerName, FullSpeakerName, FirstTurn, RangeFrom, RangeTo, Notes + +inSpeakerPath = inSpeakerDir +if inSpeakerPath[-1] != "/": + inSpeakerPath += "/" + +inSpeakerPath += inSpeakers +#docLabel = "ls21-04" +# +#csv_reader = csv.reader(csv_file, delimiter=',') +#csv_reader = csv.DictReader(csv_file) +#csv_reader = csv.DictReader(csv_file, fieldnames = ("VideoLabel", "SpeakerLabel", "DisplayedSpeakerName", "FullSpeakerName", "FirstTurn", "RangeFrom", "RangeTo", "Notes" ), delimiter=',') +#with io.open("file", "r", newline=None) as fd: +with open(inSpeakerPath) as speaker_file: + speaker_reader = csv.reader(speaker_file, delimiter=',') + line_count = 0 + for row in speaker_reader: + if line_count == 0: + print(f'Column names are {", ".join(row)}') + line_count += 1 + else: + rowLen=len(row) + reportString = "" + if rowLen > 2 and row[1] is not None and len(row[1]) > 0: + if row[0] is not None and len(row[0]) > 0: + videoLabel = row[0] + #reportString += "In video " + row[0] + ", " + else: + videoLabel = "" + # + speakerLabel = row[1] + # + if rowLen > 2 and row[2] is not None and len(row[2]) > 0: + displayedName = row[2] + #reportString += "In video " + row[0] + ", " + else: + displayedName = "Speaker " + speakerLabel + # + #reportString += "'" + row[1] + "' stands for '" + row[2] + "'" + if rowLen > 3 and row[3] is not None and len(row[3]) > 0: + fullName = row[3] + else: + fullName = "" + #reportString += " (better known as '" + row[3] + "')" + # + if rowLen > 4 and row[4] is not None and len(row[4]) > 0: + firstTurn = row[4] + else: + firstTurn = "" + #reportString += " after timestamp " + row[5] + # + if rowLen > 5 and row[5] is not None and len(row[5]) > 0: + rangeFrom = row[5] + else: + rangeFrom = "" + # + if rowLen > 6 and row[6] is not None and len(row[6]) > 0: + rangeTo = row[6] + else: + rangeTo = "" + # + if rowLen > 7 and row[7] is not None and len(row[7]) > 0: + notes = row[7] + else: + notes = "" + # + # + if videoLabel == docLabel: # maybe allow defaulting with videoLabel = ''? 
+ speakerDesc[speakerLabel] = {'videoLabel': videoLabel, 'displayedName': displayedName, 'fullName':fullName, 'firstTurn':firstTurn, 'rangeFrom':rangeFrom, 'rangeTo':rangeTo, 'notes':notes} + #print(f'Loaded speaker description {", ".join([videoLabel, speakerLabel, displayedName, fullName, firstTurn, rangeFrom, rangeTo, notes])}') + # + line_count += 1 + +#print(f'Processed {line_count} speaker descriptions.') + +speaker_file.close() + +# -------- paragraphs CSV + +if inSentDir[-1] != "/": + inSentDir += "/" + +inParagPath = inSentDir + inParagFile +#inSentencePath = inParagPath +#inParagPath += inSentFile +#inSentencePath += inSentFile + +#parag_reader = csv.DictReader(parag_file, fieldnames = ("start", "end", "speaker", "confid", "text" )) +#parag_reader = csv.DictReader(parag_file, fieldnames = ("start", "end", "speaker", "confid", "text" ), delimiter='\t') +#parag_reader = csv.reader(parag_file, delimiter=',') + + +rawParags = {} + +paragPubPath = outDir + +if paragPubPath[-1] != "/": + paragPubPath += "/" + +paragPubPath += inSentFile + "_paragTranscript.txt" + +pPubF = open(paragPubPath, "w") + +reportableTime = 0 +parag_count = 0 +paragWordCount = 0 +current_speaker = "(Unknown Speaker)" +#with io.open("file", "r", newline=None) as fd: +parag_file = open(inParagPath, "r", newline=None) +if (parag_file == None): + print(inParagPath + " not found") +else: + allParags = parag_file.readlines() + for pCount, paragRow in enumerate(allParags): + if pCount == 0: + print("Paragraph headers: " + paragRow) + else: + row = paragRow.split('\t') + rowLen = len(row) + #print(row) + #if row[0] is not None and len(row[0]) > 0: + reportString = "" + start = row[0] + #print(start) + #reportString += "Paragraph starts at millisecond " + row[0] + ", " + end = row[1] + #reportString += "ends at " + row[1] + " " + if row[2] is not None and len(row[2]) > 0: + speaker = row[2] + else: + speaker = "" + + # + if rowLen > 3 and row[3] is not None and len(row[3]) > 0: + confid = row[3] + #reportString += ", confidence " + row[3] + " " + else: + confid = "" + + # + if rowLen > 4 and row[4] is not None and len(row[4]) > 0: + startTime = row[4] + #reportString += '"' + row[4].strip('\n') + '"' + else: + startTime = "" + + if rowLen > 5 and row[5] is not None and len(row[5]) > 0: + text = row[5] + #reportString += '"' + row[5].strip('\n') + '"' + else: + text = "" + + if rowLen > 6 and row[6] is not None and len(row[6]) > 0: + correctedText = row[6] + #reportString += '"' + row[6].strip('\n') + '"' + else: + correctedText = "" + + if rowLen > 7 and row[7] is not None and len(row[7]) > 0: + firstWordCount = row[7] + #reportString += '"' + row[7].strip('\n') + '"' + else: + firstWordCount = 0 + + if rowLen > 8 and row[8] is not None and len(row[8]) > 0: + lastWordCount = row[8] + #reportString += '"' + row[8].strip('\n') + '"' + else: + lastWordCount = 0 + + rawParags.update( {start : [end, speaker, confid, firstWordCount, lastWordCount] } ) + + # + if len(speaker)>0 or len(startTime) > 0 or len(text) > 0 or len(correctedText) > 0: + # Now build next one, two, or three lines of output ([emptyLine] [speaker line] text) + if len(correctedText) > 0: + myText = correctedText + else: + myText = text + + # + if len(speaker) > 0 and speaker != current_speaker: + pPubF.write("") # empty line before next speech act + pPubF.write("\r\n") + reportString = startTime + " " # + speakerIdToName(speaker) + ":" # Also account for missing or illformed start-time + + reportString += speakerIdToName(docLabel, speaker, reportableTime) + 
":" + # + #xx=speakerIdToName(docLabel, speaker, reportableTime) + #if len(speaker) == 1: + # reportString += "Speaker " + speaker + ":" # use lookup instead + #else: + # reportString += speaker + ":" + # + # + print(reportString) + pPubF.write(reportString) + pPubF.write("\r\n") + current_speaker = speaker + reportString = myText + print(reportString) + pPubF.write(reportString) + pPubF.write("\r\n") + else: + #reportString = ToDisplayTime(start) + " " + text + reportString = startTime + " " + myText + print(reportString) + pPubF.write(reportString) + pPubF.write("\r\n") + + # + + # + + # + print(f'Processed {pCount} paragraphs.') + +# +parag_file.close() +pPubF.close() + +print(rawParags) + + +# -------- sentences CSV + +inSentPath = inSentDir + "/" + inSentFile + +sentPubPath = outDir + +sentPubPath += inSentFile + "_transcript.txt" + +sPubF = open(sentPubPath, "w") +rawSents = {} +accumedParag = "" +sent_count = 0 +sentWordCount = 0 +lastReportTime = 0 +currentSpeaker = "(Unknown Speaker)" +lastReportTime = 0 + +paragTimes = rawParags.keys() +print("") +print(paragTimes) +print("") + +#with io.open("file", "r", newline=None) as fd: +sent_file = open(inSentPath, "r", newline=None) +if (sent_file == None): + print(inSentPath + " not found") +else: + allSents = sent_file.readlines() + for pCount, sentRow in enumerate(allSents): + if pCount == 0: + print("Sentence headers: " + sentRow) + else: + row = sentRow.split('\t') + rowLen = len(row) + #print(row) + #if row[0] is not None and len(row[0]) > 0: + reportString = "" + start = int(row[0]) + #print(start) + #reportString += "Sentence starts at millisecond " + row[0] + ", " + end = int(row[1]) + #reportString += "ends at " + row[1] + " " + if rowLen >= 3 and row[2] is not None and len(row[2]) > 0: + speaker = row[2] + else: + speaker = "" + + # + if rowLen >= 4 and row[3] is not None and len(row[3]) > 0: + confid = float(row[3]) + #reportString += ", confidence " + row[3] + " " + else: + confid = "" + + # + if rowLen >= 5 and row[4] is not None and len(row[4]) > 0: + startTime = row[4] + #reportString += '"' + row[4].strip('\n') + '"' + else: + startTime = "" + + if rowLen >= 6 and row[5] is not None and len(row[5]) > 0: + text = row[5].rstrip() + #reportString += '"' + row[5].strip('\n') + '"' + else: + text = "" + + if rowLen >= 7 and row[6] is not None and len(row[6]) > 0: + correctedText = row[6].rstrip() + #reportString += '"' + row[6].strip('\n') + '"' + else: + correctedText = "" + + if rowLen >= 8 and row[7] is not None and len(row[7]) > 0: + speakerName = row[7] + #reportString += '"' + row[7].strip('\n') + '"' + else: + speakerName = 0 + + # + if str(start) in paragTimes: + paragBreak = True + #print(str(start) + " in paragTimes") + else: + paragBreak = False + #print(str(start) + " NOT in paragTimes") + + #if len(speaker)>0 or len(startTime) > 0 or len(text) > 0 or len(correctedText) > 0: + if len(speaker)>0 or len(text) > 0: + # Now build next one, two, or three lines of output ([emptyLine] [speaker line] text) + if len(correctedText) > 0: + myText = correctedText + else: + myText = text + # + if len(speaker) > 0 and speaker != currentSpeaker: + if len(accumedParag) > 0: + sPubF.write(accumedParag) + sPubF.write("\r\n") + accumedParag = "" + # + sPubF.write("") # empty line before next speech act + sPubF.write("\r\n") + #if len(startTime) > 0: + # reportableTime = int(hhMmSsToTime(startTime)) + # reportString = startTime + #else: + reportableTime = start + reportString = ToDisplayTime(start) + # + #reportString += " " # + 
speakerIdToName(speaker) + ":" # Also account for missing or ill-formed start-time
+
+            reportString += " " + speakerIdToName(docLabel, speaker, reportableTime) + ":"
+
+            #xx=speakerIdToName(docLabel, speaker, reportableTime)
+            #if len(speaker) == 1:
+            #    reportString += " Speaker " + speaker + ":"   # use lookup instead
+            #else:
+            #    reportString += " " + speaker + ":"
+            #
+            print(reportString)
+            sPubF.write(reportString)
+            sPubF.write("\r\n")
+            currentSpeaker = speaker
+            lastReportTime = reportableTime
+            reportString = myText
+            print(reportString)
+            if len(accumedParag) > 0:
+                accumedParag += " " + reportString
+            else:
+                accumedParag = reportString
+            #
+        elif paragBreak:
+            print("New paragraph per upstream Whisper heuristic")
+            if len(accumedParag) > 0:
+                sPubF.write(accumedParag)
+                sPubF.write("\r\n")
+                accumedParag = ""
+            #
+            reportableTime = start
+            if (0 + reportableTime) > (60000 + lastReportTime):   # Only some 'forced paragraphs' need a timestamp
+                displayTime = ToDisplayTime(start)
+                reportString = displayTime + " "
+                lastReportTime = reportableTime
+            else:
+                reportString = ""
+            #
+            reportString += myText
+            print(reportString)
+            if len(accumedParag) > 0:
+                accumedParag += " " + reportString
+            else:
+                accumedParag = reportString
+            #
+        else:
+            #if len(startTime) > 0:
+            #    reportableTime = int(hhMmSsToTime(startTime))
+            #else:
+            reportableTime = start
+            if (0 + reportableTime) > (60000 + lastReportTime):   # report time every 60 seconds
+                if len(accumedParag) > 0:
+                    sPubF.write(accumedParag)
+                    sPubF.write("\r\n")
+                    accumedParag = ""
+                #
+                #if len(startTime) > 0:
+                #    displayTime = startTime
+                #else:
+                displayTime = ToDisplayTime(start)
+                #
+                reportString = displayTime + " "
+                lastReportTime = reportableTime
+            else:
+                reportString = ""
+            #
+            reportString += myText
+            print(reportString)
+            if len(accumedParag) > 0:
+                accumedParag += " " + reportString
+            else:
+                accumedParag = reportString
+            #
+        #
+    #
+    print(f'Processed {pCount} sentences.')
+
+#
+if len(accumedParag) > 0:   # flush the final accumulated paragraph, which the loop above never writes
+    sPubF.write(accumedParag)
+    sPubF.write("\r\n")
+
+sent_file.close()
+sPubF.close()
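+
+# An example of the AllSpeakers.csv layout this script expects. The column names
+# come from the comment above ("VideoLabel, SpeakerLabel, DisplayedSpeakerName,
+# FullSpeakerName, FirstTurn, RangeFrom, RangeTo, Notes"); the rows here are
+# invented placeholders, not real data:
+#
+# VideoLabel,SpeakerLabel,DisplayedSpeakerName,FullSpeakerName,FirstTurn,RangeFrom,RangeTo,Notes
+# ls039-0,A,Daniel,,0:00,,,host
+# ls039-0,B,Bleu,,2:15,,,first guest turn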