@article{Sumana-2021-Towards,
title = "Towards Automatically Generating Release Notes using Extractive Summarization Technique",
author = "Sumana, Sristy and
Sumana, Sristy",
journal = "Proceedings of the 33rd International Conference on Software Engineering and Knowledge Engineering",
year = "2021",
publisher = "KSI Research Inc.",
url = "https://gwf-uwaterloo.github.io/gwf-publications/G21-21002",
doi = "10.18293/seke2021-119",
abstract = "Release notes are admitted as an essential document by practitioners. They contain the summary of the source code changes for the software releases, such as issue fixes, added new features, and performance improvements. Manually producing release notes is a time-consuming and challenging task. For that reason, sometimes developers neglect to write release notes. For example, we collect data from GitHub with over 1,900 releases, among them 37{\%} of the release notes are empty. We propose an automatic generate release notes approach based on the commit messages and merge pull-request (PR) titles to mitigate this problem. We implement one of the popular extractive text summarization techniques, i.e., the TextRank algorithm. However, accurate keyword extraction is a vital issue in text processing. The keyword matching and topic extraction process of the TextRank algorithm ignores the semantic similarity among texts. To improve the keyword extraction method, we integrate the GloVe word embedding technique with TextRank. We develop a dataset with 1,213 release notes (after null filtering) and evaluate the generated release notes through the ROUGE metric and human evaluation. We also compare the performance of our technique with another popular extractive algorithm, latent semantic analysis (LSA). Our evaluation results show that the improved TextRank method outperforms LSA.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="Sumana-2021-Towards">
<titleInfo>
<title>Towards Automatically Generating Release Notes using Extractive Summarization Technique</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sristy</namePart>
<namePart type="family">Sumana</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 33rd International Conference on Software Engineering and Knowledge Engineering</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>KSI Research Inc.</publisher>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>Release notes are admitted as an essential document by practitioners. They contain the summary of the source code changes for the software releases, such as issue fixes, added new features, and performance improvements. Manually producing release notes is a time-consuming and challenging task. For that reason, sometimes developers neglect to write release notes. For example, we collect data from GitHub with over 1,900 releases, among them 37% of the release notes are empty. We propose an automatic generate release notes approach based on the commit messages and merge pull-request (PR) titles to mitigate this problem. We implement one of the popular extractive text summarization techniques, i.e., the TextRank algorithm. However, accurate keyword extraction is a vital issue in text processing. The keyword matching and topic extraction process of the TextRank algorithm ignores the semantic similarity among texts. To improve the keyword extraction method, we integrate the GloVe word embedding technique with TextRank. We develop a dataset with 1,213 release notes (after null filtering) and evaluate the generated release notes through the ROUGE metric and human evaluation. We also compare the performance of our technique with another popular extractive algorithm, latent semantic analysis (LSA). Our evaluation results show that the improved TextRank method outperforms LSA.</abstract>
<identifier type="citekey">Sumana-2021-Towards</identifier>
<identifier type="doi">10.18293/seke2021-119</identifier>
<location>
<url>https://gwf-uwaterloo.github.io/gwf-publications/G21-21002</url>
</location>
<part>
<date>2021</date>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T Towards Automatically Generating Release Notes using Extractive Summarization Technique
%A Sumana, Sristy
%J Proceedings of the 33rd International Conference on Software Engineering and Knowledge Engineering
%D 2021
%I KSI Research Inc.
%F Sumana-2021-Towards
%X Release notes are admitted as an essential document by practitioners. They contain the summary of the source code changes for the software releases, such as issue fixes, added new features, and performance improvements. Manually producing release notes is a time-consuming and challenging task. For that reason, sometimes developers neglect to write release notes. For example, we collect data from GitHub with over 1,900 releases, among them 37% of the release notes are empty. We propose an automatic generate release notes approach based on the commit messages and merge pull-request (PR) titles to mitigate this problem. We implement one of the popular extractive text summarization techniques, i.e., the TextRank algorithm. However, accurate keyword extraction is a vital issue in text processing. The keyword matching and topic extraction process of the TextRank algorithm ignores the semantic similarity among texts. To improve the keyword extraction method, we integrate the GloVe word embedding technique with TextRank. We develop a dataset with 1,213 release notes (after null filtering) and evaluate the generated release notes through the ROUGE metric and human evaluation. We also compare the performance of our technique with another popular extractive algorithm, latent semantic analysis (LSA). Our evaluation results show that the improved TextRank method outperforms LSA.
%R 10.18293/seke2021-119
%U https://gwf-uwaterloo.github.io/gwf-publications/G21-21002
%U https://doi.org/10.18293/seke2021-119
Markdown (Informal)
[Towards Automatically Generating Release Notes using Extractive Summarization Technique](https://gwf-uwaterloo.github.io/gwf-publications/G21-21002) (Sumana & Sumana, GWF 2021)
ACL
- Sristy Sumana and Sristy Sumana. 2021. Towards Automatically Generating Release Notes using Extractive Summarization Technique. Proceedings of the 33rd International Conference on Software Engineering and Knowledge Engineering.