Date: Wed, 3 Nov 1993 19:39:47 GMT From: Technically Sweet Subject: SCI: references on 3d audio In comp.human-factors robbie@dciem.dciem.dnd.ca (G.Robert Arrabito) writes: ------------- In terms of a company which specializes in writing software for creating 3d audio, try Bo Gehring, Focal Point 3d Audio. Email is gehring@dgp.toronto.edu Voice is 416-963-9188 ------------- From: Bowden Wise Included below are my references on the use of sound in computers, and other related audio papers. It is not sorted out to those that specifically use 3D, but there are some 3D papers below. In particular the work at NASA by Elizabeth Wenzel. %% Integration of Sound %% @InProceedings{degen92, author = "Leo Degen and Richard Mander and Gitta Salomon", title = "Working with Audio: Integrating Personal Tape Recorders and Desktop Computers", booktitle = "CHI'92 Proceedings", year = 1992, pages = "413-418", organization = "ACM SIGCHI", publisher = "ACM Press", address = "New York", month = "May 3-7" } @InProceedings{wenzel91a, author = "Eilizabeth M. Wenzel and Frederic L. Wightman and Doris J. Kistler", title = "Localization with Non-Individualized Virtual Acoustic Displays", booktitle = "CHI'91 Proceedings", year = 1991, pages = "351-359", organization = "ACM SIGCHI", publisher = "ACM Press", address = "New York", month = "April 27 - May 2" } @Article{durlach91, author = "Nat Durlach", title = "Auditory Localization in Teleoperator and Virtual Environment Systems: Ideas, Issues, and Problems", journal = "Perception", year = 1991, volume = 20, pages = "543-554" } @InCollection{wenzel92b, author = "Elizabeth M. Wenzel", title = "Three-Dimensional Virtual Acoustic Displays", booktitle = "Multimedia Interface Design", publisher = "ACM Press", year = 1992, editor = "Merra M. Blattner and Roger B. Dannenberg", series = "Frontier Series", pages = "257-288" } % % Localization of sound % @Article{kistler92, author = "Doris J. Kistler and Frederic L. Wightman", title = "A Model of Head-Related Transfer Functions Based on Principal Components and Analysis and Minimum-Phase Reconstruction", journal = "Journal of the Acoustical Society of America", year = 1992, volume = 91, number = 3, pages = "1637-1647", month = "March" } @Article{wightman92, author = "Frederic L. Wightman and Doris J. Kistler", title = "The Dominant Role of Low-Frequency Interaural Time Differences in Sound Localization", journal = "Journal of the Acoustical Society of America", year = 1992, volume = 91, number = 3, pages = "1648-1661", month = "March" } @Article{wightman89a, author = "Frederic L. Wightman and Doris J. Kistler", title = "Headphone Simulation of Free-Field Listening. I: Stimulus Synthesis", journal = "Journal of the Acoustical Society of America", year = 1989, volume = 85, number = 2, pages = "859-867", month = "February" } @Article{wightman89b, author = "Frederic L. Wightman and Doris J. Kistler", title = "Headphone Simulation of Free-Field Listening. II: Psychophysical Validation", journal = "Journal of the Acoustical Society of America", year = 1989, volume = 85, number = 2, pages = "868-878", month = "February" } @Article{plenge74, author = "G. Plenge", title = "On the Difference Between Localization and Lateralization", journal = "Journal of the Acoustical Society of America", year = 1974, volume = 56, number = 3, pages = "944-951", month = "September" } @InProceedings{wenzel91b, author = "Elizabeth M. Wenzel and Frederic L. Wightman and Doris J. Kistler", title = "Localization with Non-Individualized Virtual Acoustic Display Cues", booktitle = "CHI'91 Conference Proceedings: Reaching Through Technology", year = 1991, editor = "Scott P. Robertson and Gary M. Olson and Judith S. Olson", series = "Human Factors in Computing Systems", pages = "351-359", organization = "ACM SIGCHI", publisher = "ACM Press: Addison-Wesley", address = "New Orleans, Louisiana", month = "April 27 - May 2" } @InProceedings{gaver91b, author = "William W. Gaver", title = "Technology Affordances", booktitle = "CHI'91 Conference Proceedings: Reaching Through Technology", year = 1991, editor = "Scott P. Robertson and Gary M. Olson and Judith S. Olson", series = "Human Factors in Computing Systems", pages = "79-84", organization = "ACM SIGCHI", publisher = "ACM Press: Addison-Wesley", address = "New Orleans, Louisiana", month = "April 27 - May 2" } @InCollection{begault92a, author = "Durand R. Begault", title = "The Virtual Reality of 3-D Sound", booktitle = "Cyberarts: Exploring Art and Technology", publisher = "Miller-Freeman", year = 1992, editor = "Linda Jacobson", pages = "79-87", address = "San Francisco" } @InProceedings{begault92b, author = "Durand R. Begault", title = "An Introduction to 3-D Sound for Virtual Reality", booktitle = "Virtual Reality '92 Conference", year = 1992, editor = "Meckler", month = "Sep 23 - 25" } @Article{begault92c, author = "Durand R. Begault and Elizabeth M. Wenzel", title = "Techniques and Applications for Binaural Sound Manipulation in Human-Machine Interfaces", journal = "The International Journal of Aviation Psychology", year = 1992, volume = 2, number = 1, pages = "1-22" } @Article{begault92d, author = "Durand R. Begault", title = "Perceptual Effects of Synthetic Reverberation on Three-Dimensional Audio Systems", journal = "Journal of the Audio Engineering Society", year = 1992, volume = 40, number = 11, pages = "895-904", month = "November" } @InProceedings{begault92e, author = "Durand R. Begault", title = "Binaural Auralization and Perceptual Veridicality", booktitle = "93rd Convetion of the Audio Engineering Society in San Francisco", year = 1992, editor = "Thorburn, L. A. ", organization = "Audio Engineering Society", month = "October 1 - 4" } @Article{begault93, author = "Durand R. Begault", title = "Head-Up Auditory Displays for TCAS Advisories: A Preliminary Investigation", journal = "Human Factoris", year = 1993, note = "To appear" } @Book{lindsay72, author = "Peter H. Lindsay and Donald A. Norman", title = "Human Information Processing: An Introduction to Psychology", publisher = "Academic Press", year = 1972 } @Book{kantowitz83, author = "Barry H. Kantowitz and Robert D. Sorkin", title = "Human Factors: Understanding People-System Relationships", publisher = "John Wiley \& Sons", year = 1983 } @Book{moore82, author = "Benjamin C. J. Moore", title = "An Introduction to the Psychology of Hearing", publisher = "Academic Press", year = 1983, edition = "Second" } @Book{hamilton76, author = "Hamilton", title = "Textbook of Human Anatomy", publisher = "Macmillan", year = 1976 } @Article{vonBekesy47, author = "George von Bekesy", title = "The Variation of Phase Along the Basilar Membrane with Sinusoidal Vibrations", journal = "Journal of the Acoustical Society of America", year = 1947, volume = 19, pages = "452-460" } @Book{vonBekesy60, author = "Georg von Bekesy", title = "Experiments in Hearing", publisher = "McGraw-Hill", year = 1960, address = "New York" } @Book{apple90, author = "Apple Computer Inc.", title = "Guide to the Macintosh Family Hardware", publisher = "Addison-Wesley", year = 1990 } Ludwig, L. (1990). Extending the Notion of Window Systems to Audio. IEEE Computer 23 66-72. ---------------- I (Rob Arrabito, robbie@dretor.dciem.dnd.ca) performed an online search of articles written by Wenzel and McKinley which deal with 3d audio. Some of these overlapp with those listed above from Bowden Wise but these also contain abstracts. SYSTEM:OS - DIALOG OneSearch File 6:NTIS 1964-1993/Nov B1 File 63:TRIS 70-93/AUG File 108:Aerospace Database 1962-1993/Oct B1 ============================ ARTICLES BY ELIZABETH WENZEL ============================ 3/7/1 (Item 1 from file: 6) 1565492 NTIS Accession Number: N91-30697/7/XAB Three-Dimensional Virtual Acoustic Displays Wenzel, E. M. National Aeronautics and Space Administration, Moffett Field, CA. Ames Research Center. Corp. Source Codes: 019045001; NC473657 Report No.: NAS 1.15:103835; A-91061; NASA-TM-103835 Jul 91 36p Languages: English Journal Announcement: GRAI9201; STAR2922 NTIS Prices: PC A03/MF A01 Country of Publication: United States The development of an alternative medium for displaying information in complex human-machine interfaces is described. The 3-D virtual acoustic display is a means for accurately transferring information to a human operator using the auditory modality; it combines directional and semantic characteristics to form naturalistic representations of dynamic objects and events in remotely sensed or simulated environments. Although the technology can stand alone, it is envisioned as a component of a larger multisensory environment and will no doubt find its greatest utility in that context. The general philosophy in the design of the display has been that the development of advanced computer interfaces should be driven first by an understanding of human perceptual requirements, and later by technological capabilities or constraints. In expanding on this view, current and potential uses are addressed of virtual acoustic displays, such displays are characterized, and recent approaches to their implementation and application are reviewed, the research project at NASA-Ames is described in detail, and finally some critical research issues for the future are outlined. 3/7/2 (Item 2 from file: 6) 1544317 NTIS Accession Number: N91-23023/5/XAB Virtual Acoustics Displays Wenzel, E. M. ; Fisher, S. S. ; Stone, P. K. ; Foster, S. H. National Aeronautics and Space Administration, Moffett Field, CA. Ames Research Center. Corp. Source Codes: 019045001; NC473657 Mar 91 11p Languages: English Journal Announcement: GRAI9118; STAR2914 In National Aeronautics and Space Administration, Technology 2000, Volume 1 p 10-20. NTIS Prices: (Order as N91-23021/9, PC A18/MF A03) Country of Publication: United States The real time acoustic display capabilities are described which were developed for the Virtual Environment Workstation (VIEW) Project at NASA-Ames. The acoustic display is capable of generating localized acoustic cues in real time over headphones. An auditory symbology, a related collection of representational auditory 'objects' or 'icons', can be designed using ACE (Auditory Cue Editor), which links both discrete and continuously varying acoustic parameters with information or events in the display. During a given display scenario, the symbology can be dynamically coordinated in real time with 3-D visual objects, speech, and gestural displays. The types of displays feasible with the system range from simple warnings and alarms to the acoustic representation of multidimensional data or events. 3/7/3 (Item 3 from file: 6) 1513440 NTIS Accession Number: N91-13066/6/XAB Technical Aspects of a Demonstration Tape for Three-Dimensional Sound Displays Begault, D. R. ; Wenzel, E. M. National Aeronautics and Space Administration, Moffett Field, CA. Ames Research Center. Corp. Source Codes: 019045001; NC473657 Report No.: NAS 1.15:102826; A-90162; NASA-TM-102826 Oct 90 22p Languages: English Journal Announcement: GRAI9108; STAR2904 NTIS Prices: PC A03/MF A01 Country of Publication: United States This document was developed to accompany an audio cassette that demonstrates work in three-dimensional auditory displays, developed at the Ames Research Center Aerospace Human Factors Division. It provides a text version of the audio material, and covers the theoretical and technical issues of spatial auditory displays in greater depth than on the cassette. The technical procedures used in the production of the audio demonstration are documented, including the methods for simulating rotorcraft radio communication, synthesizing auditory icons, and using the Convolvotron, a real-time spatialization device. 3/7/4 (Item 4 from file: 6) 1499794 NTIS Accession Number: N90-28996/8/XAB Techniques and Applications for Binaural Sound Manipulation in Human-Machine Interfaces Begault, D. R. ; Wenzel, E. M. National Aeronautics and Space Administration, Moffett Field, CA. Ames Research Center. Corp. Source Codes: 019045001; NC473657 Report No.: NAS 1.15:102279; A-90066; NASA-TM-102279 Aug 90 27p Languages: English Journal Announcement: GRAI9103; STAR2823 NTIS Prices: PC A03/MF A01 Country of Publication: United States The implementation of binaural sound to speech and auditory sound cues (auditory icons) is addressed from both an applications and technical standpoint. Techniques overviewed include processing by means of filtering with head-related transfer functions. Application to advanced cockpit human interface systems is discussed, although the techniques are extendable to any human-machine interface. Research issues pertaining to three-dimensional sound displays under investigation at the Aerospace Human Factors Division at NASA Ames Research Center are described. 3/7/5 (Item 1 from file: 108) 1900830 A93-27143 Headphone localization of speech stimuli BEGAULT, DURAND R.; WENZEL, ELIZABETH M. (NASA, Ames Research Center, Moffett Field, CA) National Aeronautics and Space Administration. Ames Research Center, Moffett Field, CA. In: Human Factors Society, Annual Meeting, 35th, San Francisco, CA, Sept. 2-6, 1991, Proceedings. Vol. 1 (A93-27126 09-54). Santa Monica, CA, Human Factors Society, 1991, p. 82-86. Research supported by FAA and National Research Council. Publication Date: 1991 18 Refs. Language: English Country of Origin: United States Country of Publication: United States Document Type: CONFERENCE PAPER Documents available from AIAA Technical Library Journal Announcement: IAA9309 Recently, three dimensional acoustic display systems have been developed that synthesize virtual sound sources over headphones based on filtering by Head-Related Transfer Functions (HRTFs), the direction-dependent spectral changes caused primarily by the outer ears. Here, 11 inexperienced subjects judged the apparent spatial location of headphone-presented speech stimuli filtered with non-individualized HRTFs. About half of the subjects 'pulled' their judgements toward either the median or the lateral-vertical planes, and estimates were almost always elevated. Individual differences were pronounced for the distance judgements; 15 to 46 percent of stimuli were heard inside the head with the shortest estimates near the median plane. The results infer that most listeners can obtain useful azimuth information from speech stimuli filtered by nonindividualized RTFs. Measurements of localization error and reversal rates are comparable with a previous study that used broadband noise stimuli. (Author) Source of Abstract/Subfile: AIAA/TIS 3/7/6 (Item 2 from file: 108) 1638678 A89-31617 Virtual interface environment workstations FISHER, S. S.; WENZEL, E. M.; COLER, C.; MCGREEVY, M. W. (NASA, Ames Research Center, Moffett Field, CA) National Aeronautics and Space Administration. Ames Research Center, Moffett Field, CA. IN: Human Factors Society, Annual Meeting, 32nd, Anaheim, CA, Oct. 24-28, 1988, Proceedings. Volume 1 (A89-31601 12-54). Santa Monica, CA, Human Factors Society, 1988, p. 91-95. Publication Date: 1988 Language: English Country of Origin: United States Country of Publication: United States Document Type: CONFERENCE PAPER Documents available from AIAA Technical Library Journal Announcement: IAA8912 A head-mounted, wide-angle, stereoscopic display system controlled by operator position, voice and gesture has been developed at NASA's Ames Research Center for use as a multipurpose interface environment. This Virtual Interface Environment Workstation (VIEW) system provides a multisensory, interactive display environment in which a user can virtually explore a 360-degree synthesized or remotely sensed environment and can viscerally interact with its components. Primary applications of the system are in telerobotics, management of large-scale integrated information systems, and human factors research. System configuration, research scenarios, and research directions are described. (Author) Source of Abstract/Subfile: AIAA/TIS 3/7/7 (Item 3 from file: 108) 1638677 A89-31616 A virtual display system for conveying three-dimensional acoustic information WENZEL, ELIZABETH M. (NASA, Ames Research Center, Moffett Field, CA); WIGHTMAN, FREDERIC L. (Wisconsin, University, Madison); FOSTER, SCOTT H. (Crystal River Engineering, Groveland, CA) National Aeronautics and Space Administration. Ames Research Center, Moffett Field, CA. IN: Human Factors Society, Annual Meeting, 32nd, Anaheim, CA, Oct. 24-28, 1988, Proceedings. Volume 1 (A89-31601 12-54). Santa Monica, CA, Human Factors Society, 1988, p. 86-90. Publication Date: 1988 15 Refs. Language: English Country of Origin: United States Country of Publication: United States Document Type: CONFERENCE PAPER Documents available from AIAA Technical Library Journal Announcement: IAA8912 The development of a three-dimensional auditory display system is discussed. Theories of human sound localization and techniques for synthesizing various features of auditory spatial perceptions are examined. Psychophysical data validating the system are presented. The human factors applications of the system are considered. (R.B.) Source of Abstract/Subfile: AIAA/TIS 3/7/8 (Item 4 from file: 108) 1510380 A87-33061 Effects of stimulus characteristics and task demands on pilots' perception of dichotic messages WENZEL, ELIZABETH M. (NASA, Ames Research Center, Moffett Field, CA) National Aeronautics and Space Administration. Ames Research Center, Moffett Field, Calif. IN: Human Factors Society, Annual Meeting, 30th, Dayton, OH, Sept. 29-Oct. 3, 1986, Proceedings. Volume 2 (A87-33001 13-54). Santa Monica, CA, Human Factors Society, 1986, p. 1177-1181. Publication Date: 1986 9 Refs. Language: English Country of Origin: United States Country of Publication: United States Document Type: CONFERENCE PAPER Documents available from AIAA Technical Library Journal Announcement: IAA8713 The experiment is an initial investigation of pilot performance when auditory advisory messages are presented dichotically, either with or without a concurrent pursuit task requiring visual/motor dexterity. The dependent measures were percent correct and correct reaction times for manual responses to the auditory messages. Two stimulus variables which show facilitory effects in traditional dichotic-listening paradigms, differences in pitch and semantic content of the messages, were examined to determine their effectiveness during the functional simulation of helicopter pursuit. In an effort to accumulate points for the advisory messages for accuracy alone or for both accuracy and reaction times which were faster than their opponent's. In general, the combined effects of the stimulus and task variables are additive. When interactions do occur they suggest that an increase in task demands can sometimes mitigate, but usually does not remove, any processing advantages accrued from stimulus characteristics. The implications of these results for cockpit displays are discussed. (Author) Source of Abstract/Subfile: AIAA/TIS ============================ ARTICLES BY RICHARD McKINLEY ============================ 4/7/1 (Item 1 from file: 6) 1696632 NTIS Accession Number: AD-A265 563/7/XAB Human Auditory Localization Performance in Azimuth (Final rept. Oct 85-Jan 91) Ericson, M. A. ; McKinley, R. L. ; Valencia, G. Armstrong Lab., Wright-Patterson AFB, OH. Corp. Source Codes: 103202000; 424167 Report No.: AL-TR-1991-0080 Jan 91 30p Languages: English Journal Announcement: GRAI9318 NTIS Prices: PC A03/MF A01 Country of Publication: United States Contract No.: 7231; 39 The Harry G. Armstrong Aerospace Medical Research Laboratory developed a unique research auditory localization facility for special, in-depth investigations of human auditory localization phenomena. A study was conducted in the facility to measure localization performance with three types of acoustic signal in azimuth; (1) natural, free-field acoustic cues heard with the ears uncovered, (2) simulated cues recorded at the ears of an acoustic manikin and presented over headphones, and (3) acoustic cues generated by an electronic auditory localization cue synthesizer and presented over headphones. Purposes of the study were (1) to evaluate relative localization accuracy and response time with the free-field, simulated and synthesized cues, (2) to examine the feasibility of localization of synthesized cues over headphones, and (3) to establish data base of human auditory localization performance with these signals. Results across the three conditions averaged about 5 to 6 degrees in accuracy (magnitude error) and 3.5 to 4.5 seconds in response time. Localization performance with simulated and synthesized cues was essentially equivalent to natural (free-field) cues, demonstrating the capability of the localization cue synthesizer to present realistic directional sounds in azimuth. 4/7/4 (Item 4 from file: 6) 1373877 NTIS Accession Number: AD-A203 053/4/XAB Concept and Design of an Auditory Localization Cue Synthesizer (Master's thesis) McKinley, R. L. Air Force Inst. of Tech., Wright-Patterson AFB, OH. School of Engineering. Corp. Source Codes: 000805002; 012225 Report No.: AFIT/GE/ENG/88D-29 Dec 88 89p Languages: English Document Type: Thesis Journal Announcement: GRAI8910 NTIS Prices: PC A05/MF A01 Country of Publication: United States The purpose of this thesis was to develop the concept and basic design for an auditory localization cue synthesizer. This technology has the potential for greatly reducing threat acquisition times in hostile ground-to-air missile scenarios by providing the pilot with a heads-up localizable auditory warning over his headset. This warning allows the pilot to quickly and naturally determine the location of the threat and take the necessary evasive actions. The pertinent literature was reviewed and used to form the basis of the concept to generate localization cues over headphones utilizing real-time solid state processor. The synthesizer accepts a single monaural input and processes the signal separately for independent presentation to the left and right ears. The synthesizer uses a 3-space head tracking device to maintain a stable acoustic image when the listener moves his head. The design is complete to present localized stimuli in azimuth. A concept is described for generating stimuli in the three dimensional case for azimuth, elevation and distance. Details of the hardware and software design are in the appendices. Laboratory methodology are described for deriving the necessary parameters of the synthesizer. Experimental data collected separately from this thesis demonstrate that the concept and design are viable for the azimuth case. Localization errors with the synthesizer are compared with free field errors obtained with 10 subjects. The results show that localization accuracy is essentially equal for the two conditions. Recommendations are presented for further research and development. (KR) 4/7/16 (Item 1 from file: 108) 1702906 A90-30728 Auditory localization cue synthesis and human performance ERICSON, MARK A.; MCKINLEY, RICHARD L. (USAF, Armstrong Aerospace Medical Research Laboratory, Wright-Patterson AFB, OH) IN: NAECON 89; Proceedings of the IEEE National Aerospace and Electronics Conference, Dayton, OH, May 22-26, 1989. Volume 2 (A90-30676 12-01). New York, Institute of Electrical and Electronics Engineers, Inc., 1989, p. 718-725. Publication Date: 1989 Language: English Country of Origin: United States Country of Publication: United States Document Type: CONFERENCE PAPER Documents available from AIAA Technical Library Journal Announcement: IAA9012 Directional audio technology for headphone applications is being developed. A laboratory demonstration model of a real-time digital auditory localization cue synthesizer is integrated wih a head position tracker, A/D and D/A converters, and a host computer to form a directional audio display (DIRAD). The DIRAD presents sounds over headphones that are perceived to be outside of the listener's head and relatively easy to localize. Possible military applications of DIRAD include integration with radar warning receivers, voice communication systems, and collision avoidance systems. Performance experiments demonstrated the ability of humans to localize sounds over headphones. Overall mean magnitude errors of 6.0 deg were measured in the control condition and 4.8 deg with the DIRAD. Mean response times of 3.5 sec in the control condition and 4.3 sec with the DIRAD were measured. (I.E.) Source of Abstract/Subfile: AIAA/TIS -- Lance Norskog thinman@netcom.com Data is not information is not knowledge is not wisdom.