From ade494bf6f38294c2270dee21e7771e5b41149e5 Mon Sep 17 00:00:00 2001 From: Boris Baldassari <boris@chrysalice.org> Date: Sat, 19 Dec 2020 19:19:06 +0100 Subject: [PATCH] #5 Web site refactoring -- update. --- docs/scava.html | 67 ++++++-- docs/scava_datasets.html | 324 --------------------------------------- docs/scava_datasets.md | 57 ------- 3 files changed, 51 insertions(+), 397 deletions(-) delete mode 100644 docs/scava_datasets.html delete mode 100644 docs/scava_datasets.md diff --git a/docs/scava.html b/docs/scava.html index 8bf0809..9da6ebf 100644 --- a/docs/scava.html +++ b/docs/scava.html @@ -13,8 +13,7 @@ - - <style> + <style> /** * prism.js Github theme based on GitHub's theme. * @author Sam Clarke @@ -254,28 +253,71 @@ pre[data-line] .line-highlight[data-end]:after { content: attr(data-end); top: auto; bottom: .4em; -}html body{font-family:"Helvetica Neue",Helvetica,"Segoe UI",Arial,freesans,sans-serif;font-size:16px;line-height:1.6;color:#333;background-color:#fff;overflow:initial;box-sizing:border-box;word-wrap:break-word}html body>:first-child{margin-top:0}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{line-height:1.2;margin-top:1em;margin-bottom:16px;color:#000}html body h1{font-size:2.25em;font-weight:300;padding-bottom:.3em}html body h2{font-size:1.75em;font-weight:400;padding-bottom:.3em}html body h3{font-size:1.5em;font-weight:500}html body h4{font-size:1.25em;font-weight:600}html body h5{font-size:1.1em;font-weight:600}html body h6{font-size:1em;font-weight:600}html body h1,html body h2,html body h3,html body h4,html body h5{font-weight:600}html body h5{font-size:1em}html body h6{color:#5c5c5c}html body strong{color:#000}html body del{color:#5c5c5c}html body a:not([href]){color:inherit;text-decoration:none}html body a{color:#08c;text-decoration:none}html body a:hover{color:#00a3f5;text-decoration:none}html body img{max-width:100%}html body>p{margin-top:0;margin-bottom:16px;word-wrap:break-word}html body>ul,html 
body>ol{margin-bottom:16px}html body ul,html body ol{padding-left:2em}html body ul.no-list,html body ol.no-list{padding:0;list-style-type:none}html body ul ul,html body ul ol,html body ol ol,html body ol ul{margin-top:0;margin-bottom:0}html body li{margin-bottom:0}html body li.task-list-item{list-style:none}html body li>p{margin-top:0;margin-bottom:0}html body .task-list-item-checkbox{margin:0 .2em .25em -1.8em;vertical-align:middle}html body .task-list-item-checkbox:hover{cursor:pointer}html body blockquote{margin:16px 0;font-size:inherit;padding:0 15px;color:#5c5c5c;border-left:4px solid #d6d6d6}html body blockquote>:first-child{margin-top:0}html body blockquote>:last-child{margin-bottom:0}html body hr{height:4px;margin:32px 0;background-color:#d6d6d6;border:0 none}html body table{margin:10px 0 15px 0;border-collapse:collapse;border-spacing:0;display:block;width:100%;overflow:auto;word-break:normal;word-break:keep-all}html body table th{font-weight:bold;color:#000}html body table td,html body table th{border:1px solid #d6d6d6;padding:6px 13px}html body dl{padding:0}html body dl dt{padding:0;margin-top:16px;font-size:1em;font-style:italic;font-weight:bold}html body dl dd{padding:0 16px;margin-bottom:16px}html body code{font-family:Menlo,Monaco,Consolas,'Courier New',monospace;font-size:.85em !important;color:#000;background-color:#f0f0f0;border-radius:3px;padding:.2em 0}html body code::before,html body code::after{letter-spacing:-0.2em;content:"\00a0"}html body pre>code{padding:0;margin:0;font-size:.85em !important;word-break:normal;white-space:pre;background:transparent;border:0}html body .highlight{margin-bottom:16px}html body .highlight pre,html body pre{padding:1em;overflow:auto;font-size:.85em !important;line-height:1.45;border:#d6d6d6;border-radius:3px}html body .highlight pre{margin-bottom:0;word-break:normal}html body pre code,html body pre 
tt{display:inline;max-width:initial;padding:0;margin:0;overflow:initial;line-height:inherit;word-wrap:normal;background-color:transparent;border:0}html body pre code:before,html body pre tt:before,html body pre code:after,html body pre tt:after{content:normal}html body p,html body blockquote,html body ul,html body ol,html body dl,html body pre{margin-top:0;margin-bottom:16px}html body kbd{color:#000;border:1px solid #d6d6d6;border-bottom:2px solid #c7c7c7;padding:2px 4px;background-color:#f0f0f0;border-radius:3px}@media print{html body{background-color:#fff}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{color:#000;page-break-after:avoid}html body blockquote{color:#5c5c5c}html body pre{page-break-inside:avoid}html body table{display:table}html body img{display:block;max-width:100%;max-height:100%}html body pre,html body code{word-wrap:break-word;white-space:pre}}.markdown-preview{width:100%;height:100%;box-sizing:border-box}.markdown-preview .pagebreak,.markdown-preview .newpage{page-break-before:always}.markdown-preview pre.line-numbers{position:relative;padding-left:3.8em;counter-reset:linenumber}.markdown-preview pre.line-numbers>code{position:relative}.markdown-preview pre.line-numbers .line-numbers-rows{position:absolute;pointer-events:none;top:1em;font-size:100%;left:0;width:3em;letter-spacing:-1px;border-right:1px solid #999;-webkit-user-select:none;-moz-user-select:none;-ms-user-select:none;user-select:none}.markdown-preview pre.line-numbers .line-numbers-rows>span{pointer-events:none;display:block;counter-increment:linenumber}.markdown-preview pre.line-numbers .line-numbers-rows>span:before{content:counter(linenumber);color:#999;display:block;padding-right:.8em;text-align:right}.markdown-preview .mathjax-exps .MathJax_Display{text-align:center !important}.markdown-preview:not([for="preview"]) .code-chunk .btn-group{display:none}.markdown-preview:not([for="preview"]) .code-chunk 
.status{display:none}.markdown-preview:not([for="preview"]) .code-chunk .output-div{margin-bottom:16px}.scrollbar-style::-webkit-scrollbar{width:8px}.scrollbar-style::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}.scrollbar-style::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode]){position:relative;width:100%;height:100%;top:0;left:0;margin:0;padding:0;overflow:auto}html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{position:relative;top:0}@media screen and (min-width:914px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{padding:2em calc(50% - 457px)}}@media screen and (max-width:914px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{padding:2em}}@media screen and (max-width:450px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{font-size:14px !important;padding:1em}}@media print{html body[for="html-export"]:not([data-presentation-mode]) #sidebar-toc-btn{display:none}}html body[for="html-export"]:not([data-presentation-mode]) #sidebar-toc-btn{position:fixed;bottom:8px;left:8px;font-size:28px;cursor:pointer;color:inherit;z-index:99;width:32px;text-align:center;opacity:.4}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] #sidebar-toc-btn{opacity:1}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc{position:fixed;top:0;left:0;width:300px;height:100%;padding:32px 0 48px 0;font-size:14px;box-shadow:0 0 4px rgba(150,150,150,0.33);box-sizing:border-box;overflow:auto;background-color:inherit}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar{width:8px}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] 
.md-sidebar-toc::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc a{text-decoration:none}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{padding:0 1.6em;margin-top:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc li{margin-bottom:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{list-style-type:none}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{left:300px;width:calc(100% - 300px);padding:2em calc(50% - 457px - 150px);margin:0;box-sizing:border-box}@media screen and (max-width:1274px){html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{padding:2em}}@media screen and (max-width:450px){html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{width:100%}}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .markdown-preview{left:50%;transform:translateX(-50%)}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .md-sidebar-toc{display:none} +}html body{font-family:"Helvetica Neue",Helvetica,"Segoe UI",Arial,freesans,sans-serif;font-size:16px;line-height:1.6;color:#333;background-color:#fff;overflow:initial;box-sizing:border-box;word-wrap:break-word}html body>:first-child{margin-top:0}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{line-height:1.2;margin-top:1em;margin-bottom:16px;color:#000}html body 
h1{font-size:2.25em;font-weight:300;padding-bottom:.3em}html body h2{font-size:1.75em;font-weight:400;padding-bottom:.3em}html body h3{font-size:1.5em;font-weight:500}html body h4{font-size:1.25em;font-weight:600}html body h5{font-size:1.1em;font-weight:600}html body h6{font-size:1em;font-weight:600}html body h1,html body h2,html body h3,html body h4,html body h5{font-weight:600}html body h5{font-size:1em}html body h6{color:#5c5c5c}html body strong{color:#000}html body del{color:#5c5c5c}html body a:not([href]){color:inherit;text-decoration:none}html body a{color:#08c;text-decoration:none}html body a:hover{color:#00a3f5;text-decoration:none}html body img{max-width:100%}html body>p{margin-top:0;margin-bottom:16px;word-wrap:break-word}html body>ul,html body>ol{margin-bottom:16px}html body ul,html body ol{padding-left:2em}html body ul.no-list,html body ol.no-list{padding:0;list-style-type:none}html body ul ul,html body ul ol,html body ol ol,html body ol ul{margin-top:0;margin-bottom:0}html body li{margin-bottom:0}html body li.task-list-item{list-style:none}html body li>p{margin-top:0;margin-bottom:0}html body .task-list-item-checkbox{margin:0 .2em .25em -1.8em;vertical-align:middle}html body .task-list-item-checkbox:hover{cursor:pointer}html body blockquote{margin:16px 0;font-size:inherit;padding:0 15px;color:#5c5c5c;background-color:#f0f0f0;border-left:4px solid #d6d6d6}html body blockquote>:first-child{margin-top:0}html body blockquote>:last-child{margin-bottom:0}html body hr{height:4px;margin:32px 0;background-color:#d6d6d6;border:0 none}html body table{margin:10px 0 15px 0;border-collapse:collapse;border-spacing:0;display:block;width:100%;overflow:auto;word-break:normal;word-break:keep-all}html body table th{font-weight:bold;color:#000}html body table td,html body table th{border:1px solid #d6d6d6;padding:6px 13px}html body dl{padding:0}html body dl dt{padding:0;margin-top:16px;font-size:1em;font-style:italic;font-weight:bold}html body dl dd{padding:0 
16px;margin-bottom:16px}html body code{font-family:Menlo,Monaco,Consolas,'Courier New',monospace;font-size:.85em !important;color:#000;background-color:#f0f0f0;border-radius:3px;padding:.2em 0}html body code::before,html body code::after{letter-spacing:-0.2em;content:"\00a0"}html body pre>code{padding:0;margin:0;font-size:.85em !important;word-break:normal;white-space:pre;background:transparent;border:0}html body .highlight{margin-bottom:16px}html body .highlight pre,html body pre{padding:1em;overflow:auto;font-size:.85em !important;line-height:1.45;border:#d6d6d6;border-radius:3px}html body .highlight pre{margin-bottom:0;word-break:normal}html body pre code,html body pre tt{display:inline;max-width:initial;padding:0;margin:0;overflow:initial;line-height:inherit;word-wrap:normal;background-color:transparent;border:0}html body pre code:before,html body pre tt:before,html body pre code:after,html body pre tt:after{content:normal}html body p,html body blockquote,html body ul,html body ol,html body dl,html body pre{margin-top:0;margin-bottom:16px}html body kbd{color:#000;border:1px solid #d6d6d6;border-bottom:2px solid #c7c7c7;padding:2px 4px;background-color:#f0f0f0;border-radius:3px}@media print{html body{background-color:#fff}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{color:#000;page-break-after:avoid}html body blockquote{color:#5c5c5c}html body pre{page-break-inside:avoid}html body table{display:table}html body img{display:block;max-width:100%;max-height:100%}html body pre,html body code{word-wrap:break-word;white-space:pre}}.markdown-preview{width:100%;height:100%;box-sizing:border-box}.markdown-preview .pagebreak,.markdown-preview .newpage{page-break-before:always}.markdown-preview pre.line-numbers{position:relative;padding-left:3.8em;counter-reset:linenumber}.markdown-preview pre.line-numbers>code{position:relative}.markdown-preview pre.line-numbers 
.line-numbers-rows{position:absolute;pointer-events:none;top:1em;font-size:100%;left:0;width:3em;letter-spacing:-1px;border-right:1px solid #999;-webkit-user-select:none;-moz-user-select:none;-ms-user-select:none;user-select:none}.markdown-preview pre.line-numbers .line-numbers-rows>span{pointer-events:none;display:block;counter-increment:linenumber}.markdown-preview pre.line-numbers .line-numbers-rows>span:before{content:counter(linenumber);color:#999;display:block;padding-right:.8em;text-align:right}.markdown-preview .mathjax-exps .MathJax_Display{text-align:center !important}.markdown-preview:not([for="preview"]) .code-chunk .btn-group{display:none}.markdown-preview:not([for="preview"]) .code-chunk .status{display:none}.markdown-preview:not([for="preview"]) .code-chunk .output-div{margin-bottom:16px}.scrollbar-style::-webkit-scrollbar{width:8px}.scrollbar-style::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}.scrollbar-style::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode]){position:relative;width:100%;height:100%;top:0;left:0;margin:0;padding:0;overflow:auto}html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{position:relative;top:0}@media screen and (min-width:914px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{padding:2em calc(50% - 457px + 2em)}}@media screen and (max-width:914px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{padding:2em}}@media screen and (max-width:450px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{font-size:14px !important;padding:1em}}@media print{html body[for="html-export"]:not([data-presentation-mode]) #sidebar-toc-btn{display:none}}html body[for="html-export"]:not([data-presentation-mode]) 
#sidebar-toc-btn{position:fixed;bottom:8px;left:8px;font-size:28px;cursor:pointer;color:inherit;z-index:99;width:32px;text-align:center;opacity:.4}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] #sidebar-toc-btn{opacity:1}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc{position:fixed;top:0;left:0;width:300px;height:100%;padding:32px 0 48px 0;font-size:14px;box-shadow:0 0 4px rgba(150,150,150,0.33);box-sizing:border-box;overflow:auto;background-color:inherit}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar{width:8px}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc a{text-decoration:none}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{padding:0 1.6em;margin-top:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc li{margin-bottom:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{list-style-type:none}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{left:300px;width:calc(100% - 300px);padding:2em calc(50% - 457px - 150px);margin:0;box-sizing:border-box}@media screen and (max-width:1274px){html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{padding:2em}}@media screen and (max-width:450px){html 
body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{width:100%}}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .markdown-preview{left:50%;transform:translateX(-50%)}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .md-sidebar-toc{display:none} /* Please visit the URL below for more information: */ /* https://shd101wyy.github.io/markdown-preview-enhanced/#/customize-css */ - + </style> </head> <body for="html-export"> - <div class="mume markdown-preview "> + <div class="mume markdown-preview "> <h1 class="mume-header" id="eclipse-scava-downloads">Eclipse Scava Downloads</h1> <p><img src="scava-header.jpg" alt="Scava logo"></p> -<p>This web site hosts the various downloads available from the <a href="https://eclipse.org/scava">Eclipse Scava project</a>. It notably includes:</p> +<p>This web site hosts the open datasets generated in the course of the <a href="https://crossminer.org">Crossminer research project</a>. Crossminer was terminated in 2019, and since then the datasets have been maintained by <a href="https://castalia.solutions">Castalia Solutions</a> as a service for the Eclipse and Research communities.</p> +<p>The datasets include various pieces of data retrieved from the Eclipse forge: Mailing lists, Project development data, and AERI stacktraces in handy CSV and JSON formats, and each dataset has an R Markdown document describing its content and providing hints about how to use it. 
Examples provided mainly use the <a href="https://r-project.org">R statistical analysis software</a>.</p> +<p>All datasets are published under the <a href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons BY-Attribution-Share Alike 4.0 (International)</a>.</p> +<p>All data is anonymised; please see the <a href="datasets_privacy.html">dedicated document</a> to learn more about privacy and the anonymisation mechanism.</p> +<p>We're open: if you'd like to contribute, please see the <a href="https://gitlab.eclipse.org/bbaldassari2kd/scava-datasets">GitLab project</a> page.</p> +<h2 class="mume-header" id="eclipse-projects">Eclipse projects</h2> + +<p>We generate comprehensive data extracts of a <a href="projects/eclipse_projects.html">set of Eclipse projects</a>, including data sources like:</p> +<ul> +<li>Software Configuration Management (<a href="https://git.eclipse.org">git</a>),</li> +<li>Issues tracking (<a href="https://bugs.eclipse.org">Bugzilla</a> or GitHub),</li> +<li>Project metadata checks (<a href="https://projects.eclipse.org">PMI</a>),</li> +<li>Licencing and copyrights (<a href="https://github.com/nexB/scancode-toolkit">Scancode</a>), and</li> +<li>Static Code Analysis (<a href="https://sonarcloud.io">SonarCloud</a>) when available.</li> +</ul> +<p>These datasets are updated weekly, at 2am on Sunday. 
If you would like to add a project, please <a href="https://gitlab.eclipse.org/bbaldassari2kd/scava-datasets/-/issues">let us know</a>.</p> +<p><strong>Downloads</strong></p> +<ul> +<li><strong>List of projects</strong> See the <a href="projects/eclipse_projects.html">list of projects with their associated datasets and documentation</a>.</li> +</ul> +<h2 class="mume-header" id="eclipse-mailing-lists">Eclipse mailing lists</h2> + +<p>The <a href="eclipse_mls/eclipse_mls.html">Eclipse Mailing lists</a> dump is an extract of all emails posted on the Eclipse mailing lists.</p> <ul> -<li>Open <a href="datasets/index.html">software-engineering datasets</a> related to the Eclipse forge, including AERI stacktraces, Eclipse mailing lists, and Eclipse projects data.</li> -<li>Downloads for the Scava application (availability planned for Q3 2019).</li> +<li>Download the <strong>Eclipse mailing lists dataset</strong> [ <a href="eclipse_mls/eclipse_mls.gz">CSV</a> ].</li> +<li>Check the <strong>documentation</strong> for the dataset <a href="eclipse_mls/mbox_csv_analysis.html">here (HTML)</a>. For reproducibility we also provide the <a href="eclipse_mls/mbox_csv_analysis.rmd">R Markdown document</a> for the dataset analysis and documentation.</li> +<li>Download the <strong>mbox files</strong> [ <a href="eclipse_mls/eclipse_mls.html#project-mboxes">see the list</a> ]</li> </ul> -<h2 class="mume-header" id="more-information">More information</h2> +<p>More information can be found on the official <a href="https://accounts.eclipse.org/mailing-list">Eclipse page for mailing lists</a>.</p> +<h2 class="mume-header" id="aeri-stacktraces">AERI Stacktraces</h2> + +<p>The <a href="aeri_stacktraces/aeri_stacktraces.html">AERI stacktraces dataset</a> is a list of exceptions encountered by users in the Eclipse IDE, as retrieved by the AERI system. 
The Automated Error Reporting (AERI) system has been developed by the people at <a href="https://www.codetrails.com/">Code Trails</a> and retrieves information about exceptions. It is installed by default in the Eclipse IDE and has helped hundreds of projects better support their users and resolve bugs. This dataset is a dump of all records over a couple of years, with useful information about the exceptions and environment.</p> +<p>The last update of the dataset occurred on 2018-02-11.</p> +<p><strong>Downloads</strong></p> +<ul> +<li><strong>Problems full</strong> [ <a href="aeri_stacktraces/problems_full.tar.bz2">Download JSON</a> ] -- A list of all problems, exported as JSON (one problem per file).</li> +<li><strong>Problems extract</strong> [ <a href="aeri_stacktraces/problems_extract.csv.bz2">Download CSV</a> ] -- A list of all problems, exported as CSV (one big file).</li> +<li><strong>Incidents full</strong> [ <a href="aeri_stacktraces/incidents_full.tar.bz2">Download JSON</a> ] -- A list of all incidents, exported as JSON (one incident per file).</li> +<li><strong>Incidents extract</strong> [ <a href="aeri_stacktraces/incidents_extract.csv.bz2">Download CSV</a> ] -- A list of all incidents, exported as CSV (one big file).</li> +<li><strong>Incidents Bundles</strong> [ <a href="aeri_stacktraces/incidents_bundles_extract.csv.bz2">Download CSV</a> ] -- A list of all bundles found in incidents, exported as CSV. 
Attributes are bundle_name, bundle_version, and number of occurrences.</li> +</ul> +<p><strong>Documentation</strong></p> +<ul> +<li><strong>Stacktraces Problems analysis document</strong> [ <a href="aeri_stacktraces/problems_analysis.pdf">Download PDF</a> | <a href="aeri_stacktraces/problems_analysis.rmd">Download Rmd</a> ] -- An R Markdown document to analyse the Stacktraces problem dataset, with a description of the actual content and examples of usage.</li> +<li><strong>Stacktraces Incidents analysis document</strong> [ <a href="aeri_stacktraces/incidents_analysis.pdf">Download PDF</a> | <a href="aeri_stacktraces/incidents_analysis.rmd">Download Rmd</a> ] -- An R Markdown document to analyse the Stacktraces incidents dataset, with a description of the actual content and examples of usage.</li> +</ul> +<p>More information about the AERI system can be found on the <a href="https://www.codetrails.com/error-analytics/manual/">Code Trails website</a>.</p> +<h2 class="mume-header" id="about-scava">About Scava</h2> <p>Scava is the Eclipse spin-off of Crossminer, a EU-funded research project. 
More information can be found at the following places:</p> <ul> <li>The <a href="https://eclipse.org/scava">Eclipse Scava project</a></li> <li>The official <a href="https://scava-docs.readthedocs.io">documentation for Scava</a></li> +<li>The <a href="https://github.com/crossminer/scava-docs">documentation repository</a></li> <li>The official <a href="https://crossminer.org">Crossminer web page</a></li> <li>The <a href="https://github.com/crossminer">GitHub Crossminer organisation</a></li> </ul> @@ -283,13 +325,6 @@ pre[data-line] .line-highlight[data-end]:after { <p>All datasets are published under the <a href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons BY-Attribution-Share Alike 4.0 (International)</a>.</p> <p>All code is, unless otherwise stated, published under the <a href="https://www.eclipse.org/legal/epl-2.0/">Eclipse Public Licence, v2</a>.</p> -<h2 class="mume-header" id="associated-repositories">Associated repositories</h2> - -<p>More information can be found in the following places:</p> -<ul> -<li>The <a href="https://github.com/eclipse-scava/scava-datasets">git repository dedicated to the datasets extraction</a>: <code>git@github.com:eclipse-scava/scava-datasets.git</code></li> -<li>The <a href="https://github.com/crossminer/scava-docs">documentation repository</a> for the Scava project: <code>https://github.com/crossminer/scava-docs</code></li> -</ul> </div> diff --git a/docs/scava_datasets.html b/docs/scava_datasets.html deleted file mode 100644 index 9f301e1..0000000 --- a/docs/scava_datasets.html +++ /dev/null @@ -1,324 +0,0 @@ -<!DOCTYPE html><html><head> - <title>scava_datasets</title> - <meta charset="utf-8"> - <meta name="viewport" content="width=device-width, initial-scale=1.0"> - - <link rel="stylesheet" href="file:////home/boris/.atom/packages/markdown-preview-enhanced/node_modules/@shd101wyy/mume/dependencies/katex/katex.min.css"> - - - - - - - - - - - <style> - /** - * prism.js Github theme based on GitHub's theme. 
- * @author Sam Clarke - */ -code[class*="language-"], -pre[class*="language-"] { - color: #333; - background: none; - font-family: Consolas, "Liberation Mono", Menlo, Courier, monospace; - text-align: left; - white-space: pre; - word-spacing: normal; - word-break: normal; - word-wrap: normal; - line-height: 1.4; - - -moz-tab-size: 8; - -o-tab-size: 8; - tab-size: 8; - - -webkit-hyphens: none; - -moz-hyphens: none; - -ms-hyphens: none; - hyphens: none; -} - -/* Code blocks */ -pre[class*="language-"] { - padding: .8em; - overflow: auto; - /* border: 1px solid #ddd; */ - border-radius: 3px; - /* background: #fff; */ - background: #f5f5f5; -} - -/* Inline code */ -:not(pre) > code[class*="language-"] { - padding: .1em; - border-radius: .3em; - white-space: normal; - background: #f5f5f5; -} - -.token.comment, -.token.blockquote { - color: #969896; -} - -.token.cdata { - color: #183691; -} - -.token.doctype, -.token.punctuation, -.token.variable, -.token.macro.property { - color: #333; -} - -.token.operator, -.token.important, -.token.keyword, -.token.rule, -.token.builtin { - color: #a71d5d; -} - -.token.string, -.token.url, -.token.regex, -.token.attr-value { - color: #183691; -} - -.token.property, -.token.number, -.token.boolean, -.token.entity, -.token.atrule, -.token.constant, -.token.symbol, -.token.command, -.token.code { - color: #0086b3; -} - -.token.tag, -.token.selector, -.token.prolog { - color: #63a35c; -} - -.token.function, -.token.namespace, -.token.pseudo-element, -.token.class, -.token.class-name, -.token.pseudo-class, -.token.id, -.token.url-reference .token.variable, -.token.attr-name { - color: #795da3; -} - -.token.entity { - cursor: help; -} - -.token.title, -.token.title .token.punctuation { - font-weight: bold; - color: #1d3e81; -} - -.token.list { - color: #ed6a43; -} - -.token.inserted { - background-color: #eaffea; - color: #55a532; -} - -.token.deleted { - background-color: #ffecec; - color: #bd2c00; -} - -.token.bold { - font-weight: 
bold; -} - -.token.italic { - font-style: italic; -} - - -/* JSON */ -.language-json .token.property { - color: #183691; -} - -.language-markup .token.tag .token.punctuation { - color: #333; -} - -/* CSS */ -code.language-css, -.language-css .token.function { - color: #0086b3; -} - -/* YAML */ -.language-yaml .token.atrule { - color: #63a35c; -} - -code.language-yaml { - color: #183691; -} - -/* Ruby */ -.language-ruby .token.function { - color: #333; -} - -/* Markdown */ -.language-markdown .token.url { - color: #795da3; -} - -/* Makefile */ -.language-makefile .token.symbol { - color: #795da3; -} - -.language-makefile .token.variable { - color: #183691; -} - -.language-makefile .token.builtin { - color: #0086b3; -} - -/* Bash */ -.language-bash .token.keyword { - color: #0086b3; -} - -/* highlight */ -pre[data-line] { - position: relative; - padding: 1em 0 1em 3em; -} -pre[data-line] .line-highlight-wrapper { - position: absolute; - top: 0; - left: 0; - background-color: transparent; - display: block; - width: 100%; -} - -pre[data-line] .line-highlight { - position: absolute; - left: 0; - right: 0; - padding: inherit 0; - margin-top: 1em; - background: hsla(24, 20%, 50%,.08); - background: linear-gradient(to right, hsla(24, 20%, 50%,.1) 70%, hsla(24, 20%, 50%,0)); - pointer-events: none; - line-height: inherit; - white-space: pre; -} - -pre[data-line] .line-highlight:before, -pre[data-line] .line-highlight[data-end]:after { - content: attr(data-start); - position: absolute; - top: .4em; - left: .6em; - min-width: 1em; - padding: 0 .5em; - background-color: hsla(24, 20%, 50%,.4); - color: hsl(24, 20%, 95%); - font: bold 65%/1.5 sans-serif; - text-align: center; - vertical-align: .3em; - border-radius: 999px; - text-shadow: none; - box-shadow: 0 1px white; -} - -pre[data-line] .line-highlight[data-end]:after { - content: attr(data-end); - top: auto; - bottom: .4em; -}html body{font-family:"Helvetica Neue",Helvetica,"Segoe 
UI",Arial,freesans,sans-serif;font-size:16px;line-height:1.6;color:#333;background-color:#fff;overflow:initial;box-sizing:border-box;word-wrap:break-word}html body>:first-child{margin-top:0}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{line-height:1.2;margin-top:1em;margin-bottom:16px;color:#000}html body h1{font-size:2.25em;font-weight:300;padding-bottom:.3em}html body h2{font-size:1.75em;font-weight:400;padding-bottom:.3em}html body h3{font-size:1.5em;font-weight:500}html body h4{font-size:1.25em;font-weight:600}html body h5{font-size:1.1em;font-weight:600}html body h6{font-size:1em;font-weight:600}html body h1,html body h2,html body h3,html body h4,html body h5{font-weight:600}html body h5{font-size:1em}html body h6{color:#5c5c5c}html body strong{color:#000}html body del{color:#5c5c5c}html body a:not([href]){color:inherit;text-decoration:none}html body a{color:#08c;text-decoration:none}html body a:hover{color:#00a3f5;text-decoration:none}html body img{max-width:100%}html body>p{margin-top:0;margin-bottom:16px;word-wrap:break-word}html body>ul,html body>ol{margin-bottom:16px}html body ul,html body ol{padding-left:2em}html body ul.no-list,html body ol.no-list{padding:0;list-style-type:none}html body ul ul,html body ul ol,html body ol ol,html body ol ul{margin-top:0;margin-bottom:0}html body li{margin-bottom:0}html body li.task-list-item{list-style:none}html body li>p{margin-top:0;margin-bottom:0}html body .task-list-item-checkbox{margin:0 .2em .25em -1.8em;vertical-align:middle}html body .task-list-item-checkbox:hover{cursor:pointer}html body blockquote{margin:16px 0;font-size:inherit;padding:0 15px;color:#5c5c5c;border-left:4px solid #d6d6d6}html body blockquote>:first-child{margin-top:0}html body blockquote>:last-child{margin-bottom:0}html body hr{height:4px;margin:32px 0;background-color:#d6d6d6;border:0 none}html body table{margin:10px 0 15px 
0;border-collapse:collapse;border-spacing:0;display:block;width:100%;overflow:auto;word-break:normal;word-break:keep-all}html body table th{font-weight:bold;color:#000}html body table td,html body table th{border:1px solid #d6d6d6;padding:6px 13px}html body dl{padding:0}html body dl dt{padding:0;margin-top:16px;font-size:1em;font-style:italic;font-weight:bold}html body dl dd{padding:0 16px;margin-bottom:16px}html body code{font-family:Menlo,Monaco,Consolas,'Courier New',monospace;font-size:.85em !important;color:#000;background-color:#f0f0f0;border-radius:3px;padding:.2em 0}html body code::before,html body code::after{letter-spacing:-0.2em;content:"\00a0"}html body pre>code{padding:0;margin:0;font-size:.85em !important;word-break:normal;white-space:pre;background:transparent;border:0}html body .highlight{margin-bottom:16px}html body .highlight pre,html body pre{padding:1em;overflow:auto;font-size:.85em !important;line-height:1.45;border:#d6d6d6;border-radius:3px}html body .highlight pre{margin-bottom:0;word-break:normal}html body pre code,html body pre tt{display:inline;max-width:initial;padding:0;margin:0;overflow:initial;line-height:inherit;word-wrap:normal;background-color:transparent;border:0}html body pre code:before,html body pre tt:before,html body pre code:after,html body pre tt:after{content:normal}html body p,html body blockquote,html body ul,html body ol,html body dl,html body pre{margin-top:0;margin-bottom:16px}html body kbd{color:#000;border:1px solid #d6d6d6;border-bottom:2px solid #c7c7c7;padding:2px 4px;background-color:#f0f0f0;border-radius:3px}@media print{html body{background-color:#fff}html body h1,html body h2,html body h3,html body h4,html body h5,html body h6{color:#000;page-break-after:avoid}html body blockquote{color:#5c5c5c}html body pre{page-break-inside:avoid}html body table{display:table}html body img{display:block;max-width:100%;max-height:100%}html body pre,html body 
code{word-wrap:break-word;white-space:pre}}.markdown-preview{width:100%;height:100%;box-sizing:border-box}.markdown-preview .pagebreak,.markdown-preview .newpage{page-break-before:always}.markdown-preview pre.line-numbers{position:relative;padding-left:3.8em;counter-reset:linenumber}.markdown-preview pre.line-numbers>code{position:relative}.markdown-preview pre.line-numbers .line-numbers-rows{position:absolute;pointer-events:none;top:1em;font-size:100%;left:0;width:3em;letter-spacing:-1px;border-right:1px solid #999;-webkit-user-select:none;-moz-user-select:none;-ms-user-select:none;user-select:none}.markdown-preview pre.line-numbers .line-numbers-rows>span{pointer-events:none;display:block;counter-increment:linenumber}.markdown-preview pre.line-numbers .line-numbers-rows>span:before{content:counter(linenumber);color:#999;display:block;padding-right:.8em;text-align:right}.markdown-preview .mathjax-exps .MathJax_Display{text-align:center !important}.markdown-preview:not([for="preview"]) .code-chunk .btn-group{display:none}.markdown-preview:not([for="preview"]) .code-chunk .status{display:none}.markdown-preview:not([for="preview"]) .code-chunk .output-div{margin-bottom:16px}.scrollbar-style::-webkit-scrollbar{width:8px}.scrollbar-style::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}.scrollbar-style::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode]){position:relative;width:100%;height:100%;top:0;left:0;margin:0;padding:0;overflow:auto}html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{position:relative;top:0}@media screen and (min-width:914px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{padding:2em calc(50% - 457px)}}@media screen and (max-width:914px){html body[for="html-export"]:not([data-presentation-mode]) 
.markdown-preview{padding:2em}}@media screen and (max-width:450px){html body[for="html-export"]:not([data-presentation-mode]) .markdown-preview{font-size:14px !important;padding:1em}}@media print{html body[for="html-export"]:not([data-presentation-mode]) #sidebar-toc-btn{display:none}}html body[for="html-export"]:not([data-presentation-mode]) #sidebar-toc-btn{position:fixed;bottom:8px;left:8px;font-size:28px;cursor:pointer;color:inherit;z-index:99;width:32px;text-align:center;opacity:.4}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] #sidebar-toc-btn{opacity:1}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc{position:fixed;top:0;left:0;width:300px;height:100%;padding:32px 0 48px 0;font-size:14px;box-shadow:0 0 4px rgba(150,150,150,0.33);box-sizing:border-box;overflow:auto;background-color:inherit}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar{width:8px}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar-track{border-radius:10px;background-color:transparent}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc::-webkit-scrollbar-thumb{border-radius:5px;background-color:rgba(150,150,150,0.66);border:4px solid rgba(150,150,150,0.66);background-clip:content-box}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc a{text-decoration:none}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{padding:0 1.6em;margin-top:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc li{margin-bottom:.8em}html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .md-sidebar-toc ul{list-style-type:none}html 
body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{left:300px;width:calc(100% - 300px);padding:2em calc(50% - 457px - 150px);margin:0;box-sizing:border-box}@media screen and (max-width:1274px){html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{padding:2em}}@media screen and (max-width:450px){html body[for="html-export"]:not([data-presentation-mode])[html-show-sidebar-toc] .markdown-preview{width:100%}}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .markdown-preview{left:50%;transform:translateX(-50%)}html body[for="html-export"]:not([data-presentation-mode]):not([html-show-sidebar-toc]) .md-sidebar-toc{display:none} -/* Please visit the URL below for more information: */ -/* https://shd101wyy.github.io/markdown-preview-enhanced/#/customize-css */ - - </style> - </head> - <body for="html-export"> - <div class="mume markdown-preview "> - <h1 class="mume-header" id="eclipse-scava-datasets">Eclipse Scava Datasets</h1> - -<p>This web site hosts the open datasets generated in the course of the Crossminer research project. It includes various pieces of data retrieved from the Eclipse forge in CSV and JSON formats, and each dataset has a R Markdown document describing its content and providing hints about how to use it. 
Examples provided mainly use the <a href="https://r-project.org">R statistical analysis software</a>.</p> -<p>All datasets are published under the <a href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons BY-Attribution-Share Alike 4.0 (International)</a>.</p> -<p>All data is anonymised, please see the <a href="../docs/datasets_privacy.html">dedicated document</a> to learn more about privacy and the anonymisation mecanism.</p> -<h2 class="mume-header" id="eclipse-projects">Eclipse projects</h2> - -<p>We generate full data extracts of a <a href="projects/eclipse_projects.html">set of Eclipse projects</a>, including data sources like:</p> -<ul> -<li>SCM (<a href="https://git.eclipse.org">git</a>),</li> -<li>Issues tracking (<a href="https://bugs.eclipse.org">Bugzilla</a>),</li> -<li><a href="https://projects.eclipse.org">PMI</a> checks,</li> -<li>Static Code Analysis (<a href="https://sonar.eclipse.org">SonarQube</a>).</li> -</ul> -<p>These datasets are updated weekly, at 2am on Sunday.</p> -<p><strong>Downloads</strong></p> -<ul> -<li><strong>List of projects</strong> See the <a href="projects/eclipse_projects.html">list of projects with their associated datasets and documentation</a>.</li> -</ul> -<h2 class="mume-header" id="aeri-stacktraces">AERI Stacktraces</h2> - -<p>The <a href="aeri_stacktraces/aeri_stacktraces.html">AERI stacktraces dataset</a> is a list of exceptions encountered by users in the Eclipse IDE, as retrieved by the AERI system. The Automated Error Reporting (AERI) system has been developed by the people at <a href="https://www.codetrails.com/">Code Trails</a> and retrieves information about exceptions. It is installed by default in the Eclipse IDE and has helped hundreds of projects better support their users and resolve bugs. 
This dataset is a dump of all records over a couple of years, with useful information about the exceptions and environment.</p> -<p>Last update of the dataset occured on 2018-02-11.</p> -<p><strong>Downloads</strong></p> -<ul> -<li><strong>Problems full</strong> [ <a href="aeri_stacktraces/problems_full.tar.bz2">Download JSON</a> ] -- A list of all problems, exported as JSON (one problem per file).</li> -<li><strong>Problems extract</strong> [ <a href="aeri_stacktraces/problems_extract.csv.bz2">Download CSV</a> ] -- A list of all problems, exported as CSV (one big file).</li> -<li><strong>Incidents full</strong> [ <a href="aeri_stacktraces/incidents_full.tar.bz2">Download JSON</a> ] -- A list of all incidents, exported as JSON (one incident per file).</li> -<li><strong>Incidents extract</strong> [ <a href="aeri_stacktraces/incidents_extract.csv.bz2">Download CSV</a> ] -- A list of all incidents, exported as CSV (one big file).</li> -<li><strong>Incidents Bundles</strong> [ <a href="aeri_stacktraces/incidents_bundles_extract.csv.bz2">Download CSV</a> ] -- A list of all bundles found in incidents, exported as CSV. 
Attributes are bundle_name, bundle_version, and number of occurrences.</li> -</ul> -<p><strong>Documentation</strong></p> -<ul> -<li><strong>Stacktraces Problems analysis document</strong> [ <a href="aeri_stacktraces/problems_analysis.pdf">Download PDF</a> | <a href="aeri_stacktraces/problems_analysis.rmd">Download Rmd</a> ] -- A R Markdown document to analyse the Stacktraces problem dataset, with description of the actual content and examples of usage.</li> -<li><strong>Stacktraces Incidents analysis document</strong> [ <a href="aeri_stacktraces/incidents_analysis.pdf">Download PDF</a> | <a href="aeri_stacktraces/incidents_analysis.rmd">Download Rmd</a> ] -- A R Markdown document to analyse the Stacktraces incidents dataset, with description of the actual content and examples of usage.</li> -</ul> -<p>More information about the AERI system can be found on the <a href="https://www.codetrails.com/error-analytics/manual/">Code Trails website</a>.</p> -<h2 class="mume-header" id="eclipse-mailing-lists">Eclipse mailing lists</h2> - -<p>The <a href="eclipse_mls/eclipse_mls.html">Eclipse Mailing lists</a> dump is an extract of all emails posted on the Eclipse mailing lists.</p> -<ul> -<li>Download the <strong>Eclipse mailing lists dataset</strong> [ <a href="eclipse_mls/eclipse_mls.gz">CSV</a> ].</li> -<li>Check the <strong>documentation</strong> for the dataset <a href="eclipse_mls/mbox_csv_analysis.html">here (HTML)</a>. 
For reproducibility we also provide the <a href="eclipse_mls/mbox_csv_analysis.rmd">R Markdown document</a> for the dataset analysis and documentation.</li> -<li>Download the <strong>mbox files</strong> [ <a href="eclipse_mls/eclipse_mls.html#project-mboxes">see the list</a> ]</li> -</ul> -<p>More information can be found on the official <a href="https://accounts.eclipse.org/mailing-list">Eclipse page for mailing lists</a>.</p> - - </div> - - - - - - - - - - - - </body></html> \ No newline at end of file diff --git a/docs/scava_datasets.md b/docs/scava_datasets.md deleted file mode 100644 index 7849f4a..0000000 --- a/docs/scava_datasets.md +++ /dev/null @@ -1,57 +0,0 @@ - -# Eclipse Scava Datasets - -This web site hosts the open datasets generated in the course of the Crossminer research project. It includes various pieces of data retrieved from the Eclipse forge in CSV and JSON formats, and each dataset has a R Markdown document describing its content and providing hints about how to use it. Examples provided mainly use the [R statistical analysis software](https://r-project.org). - -All datasets are published under the [Creative Commons BY-Attribution-Share Alike 4.0 (International)](https://creativecommons.org/licenses/by-sa/4.0/). - -All data is anonymised, please see the [dedicated document](../docs/datasets_privacy.html) to learn more about privacy and the anonymisation mecanism. - - -## Eclipse projects - -We generate full data extracts of a [set of Eclipse projects](projects/eclipse_projects.html), including data sources like: - -* SCM ([git](https://git.eclipse.org)), -* Issues tracking ([Bugzilla](https://bugs.eclipse.org)), -* [PMI](https://projects.eclipse.org) checks, -* Static Code Analysis ([SonarQube](https://sonar.eclipse.org)). - -These datasets are updated weekly, at 2am on Sunday. - -**Downloads** - -* **List of projects** See the [list of projects with their associated datasets and documentation](projects/eclipse_projects.html). 
- - -## AERI Stacktraces - -The [AERI stacktraces dataset](aeri_stacktraces/aeri_stacktraces.html) is a list of exceptions encountered by users in the Eclipse IDE, as retrieved by the AERI system. The Automated Error Reporting (AERI) system has been developed by the people at [Code Trails](https://www.codetrails.com/) and retrieves information about exceptions. It is installed by default in the Eclipse IDE and has helped hundreds of projects better support their users and resolve bugs. This dataset is a dump of all records over a couple of years, with useful information about the exceptions and environment. - -Last update of the dataset occured on 2018-02-11. - -**Downloads** - -* **Problems full** [ [Download JSON](aeri_stacktraces/problems_full.tar.bz2) ] -- A list of all problems, exported as JSON (one problem per file). -* **Problems extract** [ [Download CSV](aeri_stacktraces/problems_extract.csv.bz2) ] -- A list of all problems, exported as CSV (one big file). -* **Incidents full** [ [Download JSON](aeri_stacktraces/incidents_full.tar.bz2) ] -- A list of all incidents, exported as JSON (one incident per file). -* **Incidents extract** [ [Download CSV](aeri_stacktraces/incidents_extract.csv.bz2) ] -- A list of all incidents, exported as CSV (one big file). -* **Incidents Bundles** [ [Download CSV](aeri_stacktraces/incidents_bundles_extract.csv.bz2) ] -- A list of all bundles found in incidents, exported as CSV. Attributes are bundle_name, bundle_version, and number of occurrences. - -**Documentation** - -* **Stacktraces Problems analysis document** [ [Download PDF](aeri_stacktraces/problems_analysis.pdf) | [Download Rmd](aeri_stacktraces/problems_analysis.rmd) ] -- A R Markdown document to analyse the Stacktraces problem dataset, with description of the actual content and examples of usage. 
-* **Stacktraces Incidents analysis document** [ [Download PDF](aeri_stacktraces/incidents_analysis.pdf) | [Download Rmd](aeri_stacktraces/incidents_analysis.rmd) ] -- A R Markdown document to analyse the Stacktraces incidents dataset, with description of the actual content and examples of usage. - -More information about the AERI system can be found on the [Code Trails website](https://www.codetrails.com/error-analytics/manual/). - - -## Eclipse mailing lists - -The [Eclipse Mailing lists](eclipse_mls/eclipse_mls.html) dump is an extract of all emails posted on the Eclipse mailing lists. - -* Download the **Eclipse mailing lists dataset** [ [CSV](eclipse_mls/eclipse_mls.gz) ]. -* Check the **documentation** for the dataset [here (HTML)](eclipse_mls/mbox_csv_analysis.html). For reproducibility we also provide the [R Markdown document](eclipse_mls/mbox_csv_analysis.rmd) for the dataset analysis and documentation. -* Download the **mbox files** [ [see the list](eclipse_mls/eclipse_mls.html#project-mboxes) ] - -More information can be found on the official [Eclipse page for mailing lists](https://accounts.eclipse.org/mailing-list). -- GitLab