@inproceedings{10.1145/3491102.3517582,
author = {Wu, Tongshuang and Terry, Michael and Cai, Carrie Jun},
title = {AI Chains: Transparent and Controllable Human-AI Interaction by Chaining Large Language Model Prompts},
year = {2022},
isbn = {9781450391573},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3491102.3517582},
doi = {10.1145/3491102.3517582},
abstract = {Although large language models (LLMs) have demonstrated impressive potential on simple tasks, their breadth of scope, lack of transparency, and insufficient controllability can make them less effective when assisting humans on more complex tasks. In response, we introduce the concept of Chaining LLM steps together, where the output of one step becomes the input for the next, thus aggregating the gains per step. We first define a set of LLM primitive operations useful for Chain construction, then present an interactive system where users can modify these Chains, along with their intermediate results, in a modular way. In a 20-person user study, we found that Chaining not only improved the quality of task outcomes, but also significantly enhanced system transparency, controllability, and sense of collaboration. Additionally, we saw that users developed new ways of interacting with LLMs through Chains: they leveraged sub-tasks to calibrate model expectations, compared and contrasted alternative strategies by observing parallel downstream effects, and debugged unexpected model outputs by “unit-testing” sub-components of a Chain. In two case studies, we further explore how LLM Chains may be used in future applications.},
booktitle = {Proceedings of the 2022 CHI Conference on Human Factors in Computing Systems},
articleno = {385},
numpages = {22},
keywords = {Large Language Models, Natural Language Processing, Human-AI Interaction},
location = {New Orleans, LA, USA},
series = {CHI '22},
month = {04}
}
@inproceedings{10.1145/3490099.3511105,
author = {Yuan, Ann and Coenen, Andy and Reif, Emily and Ippolito, Daphne},
title = {Wordcraft: Story Writing With Large Language Models},
year = {2022},
isbn = {9781450391443},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3490099.3511105},
doi = {10.1145/3490099.3511105},
abstract = {The latest generation of large neural language models such as GPT-3 have achieved new levels of performance on benchmarks for language understanding and generation. These models have even demonstrated an ability to perform arbitrary tasks without explicit training. In this work, we sought to learn how people might use such models in the process of creative writing. We built Wordcraft, a text editor in which users collaborate with a generative language model to write a story. We evaluated Wordcraft with a user study in which participants wrote short stories with and without the tool. Our results show that large language models enable novel co-writing experiences. For example, the language model is able to engage in open-ended conversation about the story, respond to writers’ custom requests expressed in natural language (such as ”rewrite this text to be more Dickensian”), and generate suggestions that serve to unblock writers in the creative process. Based on these results, we discuss design implications for future human-AI co-writing systems.},
booktitle = {27th International Conference on Intelligent User Interfaces},
pages = {841--852},
numpages = {12},
keywords = {NLP},
location = {Helsinki, Finland},
series = {IUI '22},
month = {03}
}
@misc{dibia2023lida,
title = {LIDA: A Tool for Automatic Generation of Grammar-Agnostic Visualizations and Infographics using Large Language Models},
author = {Victor Dibia},
year = {2023},
eprint = {2303.02927},
archivePrefix = {arXiv},
primaryClass = {cs.AI},
month = {03}
}
@misc{jiang2023graphologue,
title = {Graphologue: Exploring Large Language Model Responses with Interactive Diagrams},
author = {Peiling Jiang and Jude Rayan and Steven P. Dow and Haijun Xia},
year = {2023},
eprint = {2305.11473},
archivePrefix = {arXiv},
primaryClass = {cs.HC},
month = {05}
}
@inproceedings{10.1145/3544548.3581560,
author = {Valencia, Stephanie and Cave, Richard and Kallarackal, Krystal and Seaver, Katie and Terry, Michael and Kane, Shaun K.},
title = {“The Less I Type, the Better”: How AI Language Models Can Enhance or Impede Communication for AAC Users},
year = {2023},
isbn = {9781450394215},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3544548.3581560},
doi = {10.1145/3544548.3581560},
abstract = {Users of augmentative and alternative communication (AAC) devices sometimes find it difficult to communicate in real time with others due to the time it takes to compose messages. AI technologies such as large language models (LLMs) provide an opportunity to support AAC users by improving the quality and variety of text suggestions. However, these technologies may fundamentally change how users interact with AAC devices as users transition from typing their own phrases to prompting and selecting AI-generated phrases. We conducted a study in which 12 AAC users tested live suggestions from a language model across three usage scenarios: extending short replies, answering biographical questions, and requesting assistance. Our study participants believed that AI-generated phrases could save time, physical and cognitive effort when communicating, but felt it was important that these phrases reflect their own communication style and preferences. This work identifies opportunities and challenges for future AI-enhanced AAC devices.},
booktitle = {Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems},
articleno = {830},
numpages = {14},
keywords = {communication, artificial intelligence, large language models, accessibility},
location = {Hamburg, Germany},
series = {CHI '23},
month = {04}
}
@misc{koh2023generating,
title = {Generating Images with Multimodal Language Models},
author = {Jing Yu Koh and Daniel Fried and Ruslan Salakhutdinov},
year = {2023},
eprint = {2305.17216},
archivePrefix = {arXiv},
primaryClass = {cs.CL},
month = {05}
}
@misc{cai2023lowcode,
title = {Low-code LLM: Visual Programming over LLMs},
author = {Yuzhe Cai and Shaoguang Mao and Wenshan Wu and Zehua Wang and Yaobo Liang and Tao Ge and Chenfei Wu and Wang You and Ting Song and Yan Xia and Jonathan Tien and Nan Duan},
year = {2023},
eprint = {2304.08103},
archivePrefix = {arXiv},
primaryClass = {cs.CL},
month = {04}
}
@inproceedings{swanson-etal-2021-story,
title = {Story Centaur: Large Language Model Few Shot Learning as a Creative Writing Tool},
author = {Swanson, Ben and Mathewson, Kory and Pietrzak, Ben and Chen, Sherol and Dinalescu, Monica},
booktitle = {Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: System Demonstrations},
month = {04},
year = {2021},
address = {Online},
publisher = {Association for Computational Linguistics},
url = {https://aclanthology.org/2021.eacl-demos.29},
doi = {10.18653/v1/2021.eacl-demos.29},
pages = {244--256},
abstract = {Few shot learning with large language models has the potential to give individuals without formal machine learning training the access to a wide range of text to text models. We consider how this applies to creative writers and present Story Centaur, a user interface for prototyping few shot models and a set of recombinable web components that deploy them. Story Centaur{'}s goal is to expose creative writers to few shot learning with a simple but powerful interface that lets them compose their own co-creation tools that further their own unique artistic directions. We build out several examples of such tools, and in the process probe the boundaries and issues surrounding generation with large language models.}
}
@misc{mishra2023promptaid,
title = {PromptAid: Prompt Exploration, Perturbation, Testing and Iteration using Visual Analytics for Large Language Models},
author = {Aditi Mishra and Utkarsh Soni and Anjana Arunkumar and Jinbin Huang and Bum Chul Kwon and Chris Bryan},
year = {2023},
eprint = {2304.01964},
archivePrefix = {arXiv},
primaryClass = {cs.HC},
month = {04}
}
@misc{fan2018hierarchical,
title = {Hierarchical Neural Story Generation},
author = {Fan, Angela and Lewis, Mike and Dauphin, Yann},
year = {2018},
eprint = {1805.04833},
archivePrefix = {arXiv},
primaryClass = {cs.CL},
month = {05}
}
@article{vaswani2017attention,
title = {Attention Is All You Need},
author = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, {\L}ukasz and Polosukhin, Illia},
journal = {Advances in Neural Information Processing Systems},
volume = {30},
year = {2017},
month = {12}
}
@inproceedings{10.1145/3544548.3581196,
author = {Jakesch, Maurice and Bhat, Advait and Buschek, Daniel and Zalmanson, Lior and Naaman, Mor},
title = {Co-Writing with Opinionated Language Models Affects Users’ Views},
year = {2023},
isbn = {9781450394215},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3544548.3581196},
doi = {10.1145/3544548.3581196},
abstract = {If large language models like GPT-3 preferably produce a particular point of view, they may influence people’s opinions on an unknown scale. This study investigates whether a language-model-powered writing assistant that generates some opinions more often than others impacts what users write – and what they think. In an online experiment, we asked participants (N=1,506) to write a post discussing whether social media is good for society. Treatment group participants used a language-model-powered writing assistant configured to argue that social media is good or bad for society. Participants then completed a social media attitude survey, and independent judges (N=500) evaluated the opinions expressed in their writing. Using the opinionated language model affected the opinions expressed in participants’ writing and shifted their opinions in the subsequent attitude survey. We discuss the wider implications of our results and argue that the opinions built into AI language technologies need to be monitored and engineered more carefully.},
booktitle = {Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems},
articleno = {111},
numpages = {15},
keywords = {GPT-3, risks of large language models, Co-writing, opinion change},
location = {Hamburg, Germany},
series = {CHI '23},
month = {04}
}
@inproceedings{10.1145/3544548.3580969,
author = {Bala, Paulo and James, Stuart and Del Bue, Alessio and Nisi, Valentina},
editor = {Vosmeer, Mirjam and Holloway-Attaway, Lissa},
title = {Writing with (Digital) Scissors: Designing a Text Editing Tool for Assisted Storytelling Using Crowd-Generated Content},
booktitle = {Interactive Storytelling},
year = {2022},
publisher = {Springer International Publishing},
address = {Cham},
pages = {139--158},
abstract = {Digital Storytelling can exploit numerous technologies and sources of information to support the creation, refinement and enhancement of a narrative. Research on text editing tools has created novel interactions that support authors in different stages of the creative process, such as the inclusion of crowd-generated content for writing. While these interactions have the potential to change workflows, integration of these in a way that is useful and matches users' needs is unclear. In order to investigate the space of Assisted Storytelling, we designed and conducted a study to analyze how users write and edit a story about Cultural Heritage using an auxiliary source like Wikipedia. Through a diffractive analysis of stories, creative processes, and social and cultural contexts, we reflect and derive implications for design. These were applied to develop an AI-supported text editing tool using crowd-sourced content from Wikipedia and Wikidata.},
isbn = {978-3-031-22298-6},
month = {12}
}
@inproceedings{10.1145/3526113.3545672,
author = {Dang, Hai and Benharrak, Karim and Lehmann, Florian and Buschek, Daniel},
title = {Beyond Text Generation: Supporting Writers with Continuous Automatic Text Summaries},
year = {2022},
isbn = {9781450393201},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3526113.3545672},
doi = {10.1145/3526113.3545672},
abstract = {We propose a text editor to help users plan, structure and reflect on their writing process. It provides continuously updated paragraph-wise summaries as margin annotations, using automatic text summarization. Summary levels range from full text, to selected (central) sentences, down to a collection of keywords. To understand how users interact with this system during writing, we conducted two user studies (N=4 and N=8) in which people wrote analytic essays about a given topic and article. As a key finding, the summaries gave users an external perspective on their writing and helped them to revise the content and scope of their drafted paragraphs. People further used the tool to quickly gain an overview of the text and developed strategies to integrate insights from the automated summaries. More broadly, this work explores and highlights the value of designing AI tools for writers, with Natural Language Processing (NLP) capabilities that go beyond direct text generation and correction.},
booktitle = {Proceedings of the 35th Annual ACM Symposium on User Interface Software and Technology},
articleno = {98},
numpages = {13},
keywords = {semantic zoom, text summarization, Natural Language Processing, reverse outlining, Text documents},
location = {Bend, OR, USA},
series = {UIST '22},
month = {10}
}
@inproceedings{yang2022ai,
title = {AI as an Active Writer: Interaction strategies with generated text in human-AI collaborative fiction writing},
author = {Yang, Daijin and Zhou, Yanpeng and Zhang, Zhiyuan and Li, Toby Jia-Jun and LC, Ray},
booktitle = {Joint Proceedings of the ACM IUI Workshops},
volume = {10},
year = {2022},
organization = {CEUR-WS Team},
month = {03}
}
@article{10.1145/3511599,
author = {Singh, Nikhil and Bernal, Guillermo and Savchenko, Daria and Glassman, Elena L.},
title = {Where to Hide a Stolen Elephant: Leaps in Creative Writing with Multimodal Machine Intelligence},
year = {2022},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
issn = {1073-0516},
url = {https://doi.org/10.1145/3511599},
doi = {10.1145/3511599},
abstract = {While developing a story, novices and published writers alike have had to look outside themselves for inspiration. Language models have recently been able to generate text fluently, producing new stochastic narratives upon request. However, effectively integrating such capabilities with human cognitive faculties and creative processes remains challenging. We propose to investigate this integration with a multimodal writing support interface that offers writing suggestions textually, visually, and aurally. We conduct an extensive study that combines elicitation of prior expectations before writing, observation and semi-structured interviews during writing, and outcome evaluations after writing. Our results illustrate individual and situational variation in machine-in-the-loop writing approaches, suggestion acceptance, and ways the system is helpful. Centrally, we report how participants perform integrative leaps, by which they do cognitive work to integrate suggestions of varying semantic relevance into their developing stories. We interpret these findings, offering modeling and design recommendations for future creative writing support technologies.},
note = {Just Accepted},
journal = {ACM Trans. Comput.-Hum. Interact.},
month = {02},
keywords = {multimodal, audio, interface, images, human-AI interaction, writing, AI, story, audiovisual, creativity support}
}
@inproceedings{10.1609/aiide.v18i1.21955,
author = {Kreminski, Max and Dickinson, Melanie and Wardrip-Fruin, Noah and Mateas, Michael},
title = {Loose Ends: A Mixed-Initiative Creative Interface for Playful Storytelling},
year = {2022},
isbn = {978-1-57735-877-0},
publisher = {AAAI Press},
url = {https://doi.org/10.1609/aiide.v18i1.21955},
doi = {10.1609/aiide.v18i1.21955},
abstract = {We present Loose Ends, a mixed-initiative co-creative storytelling play experience in which a human player and an AI system work together to compose a story. Loose Ends specifically aims to provide computational support for managing multiple parallel plot threads and bringing these threads to satisfying conclusions—something that has proven difficult in past attempts to facilitate playful mixed-initiative storytelling. We describe the overall human-AI interaction loop in Loose Ends, including the implementation of the rules-based AI system that enables this interaction loop; discuss four examples of desirable mixed-initiative interactions that are possible in Loose Ends, but not in similar systems; and present results from a preliminary expert evaluation of Loose Ends. Altogether, we find that Loose Ends shows promise for creating a sense of coauthorship in the player while also mitigating the directionlessness reported by players of earlier systems.},
booktitle = {Proceedings of the Eighteenth AAAI Conference on Artificial Intelligence and Interactive Digital Entertainment},
articleno = {15},
numpages = {9},
location = {Pomona, CA, USA},
series = {AIIDE'22},
month = {12}
}
@misc{shen2023parachute,
title = {Parachute: Evaluating Interactive Human-LM Co-writing Systems},
author = {Hua Shen and Tongshuang Wu},
year = {2023},
eprint = {2303.06333},
archivePrefix = {arXiv},
primaryClass = {cs.HC},
month = {03}
}
@inproceedings{fok2023future,
title = {What Can’t Large Language Models Do? The Future of AI-Assisted Academic Writing},
author = {Fok, Raymond and Weld, Daniel S},
booktitle = {In2Writing Workshop at CHI},
year = {2023},
month = {04}
}