<!DOCTYPE html>
<!--
Copyright (C) 2025 twagoo

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program.  If not, see <http://www.gnu.org/licenses/>.
-->
<html lang="en">
    <head> 
        <!-- Document metadata -->
        <meta charset="UTF-8">
        <meta name="viewport" content="width=device-width, initial-scale=1">
        <title>CLARIN Tool Portal</title>
        <!-- Empty data: URL as icon (presumably to avoid a separate favicon request - confirm) -->
        <link rel="icon" href="data:,">

        <!-- Stylesheets; order matters for the cascade, the site's own style.css comes last -->
        <link rel="stylesheet" href="/webjars/font-awesome/7.2.0/css/fontawesome.css">
        <link rel="stylesheet" href="/webjars/font-awesome/7.2.0/css/solid.css">
        <link rel="stylesheet" href="/webjars/bootstrap/5.3.8/css/bootstrap.min.css">
        <link rel="stylesheet" href="/css/style.css">

        <!-- Deferred scripts: executed in this order after parsing, before DOMContentLoaded -->
        <script defer src="/webjars/bootstrap/5.3.8/js/bootstrap.bundle.min.js"></script>
        <script defer src="/webjars/htmx.org/2.0.10/dist/htmx.min.js"></script>
        <script defer src="/webjars/alpinejs/3.15.11/dist/cdn.min.js"></script>
        
<!--
    Third-party script served from script.crazyegg.com (presumably the session
    recording that the #testInfoModal notice refers to - confirm).
    Loaded over an explicit https: URL so the scheme never depends on how the page
    itself was requested; "async" because nothing on the page depends on it.
-->
<script src="https://script.crazyegg.com/pages/scripts/0132/2204.js" async></script>


<script>
    /*
     * Shows the session recording notice (#testInfoModal) once the DOM has loaded.
     *
     * - No stored timestamp (never shown, or storage unavailable): the notice is
     *   shown on whatever page is being viewed.
     * - Stored timestamp present: the notice is only shown again on the home page
     *   (the page containing #homePageMain) and at most once per
     *   MODAL_SHOW_INTERVAL_MS.
     *
     * The time of the last display is kept in localStorage under STORAGE_PROP.
     * Relies on the global "bootstrap" object provided by the Bootstrap bundle.
     */
    document.addEventListener("DOMContentLoaded", function () {
        const
                MODAL_SHOW_INTERVAL_MS = 60 * 60 * 1000, //do not show modal more than once per hour
                MODAL_ID = '#testInfoModal',
                STORAGE_PROP = 'testInfoModalShown',
                now = new Date(),
                isHomePage = (document.getElementById('homePageMain') !== null);

        // Merely reading window.localStorage can throw (e.g. a SecurityError when the
        // browser blocks site data). An uncaught exception here would abort the handler
        // and the notice would never be shown, so resolve the storage defensively.
        let storage = null;
        try {
            storage = window.localStorage || null;
        } catch (e) {
            console.warn('localStorage is not available, info modal state will not be persisted', e);
        }

        // Timestamp of the last display, or null if unknown
        let lastShown = null;
        if (storage) {
            try {
                lastShown = storage.getItem(STORAGE_PROP);
            } catch (e) {
                lastShown = null;
            }
        }

        let showTestInfoModal = true;
        if (lastShown !== null) {
            if (!isHomePage) {
                //show only if on home page unless never shown before
                showTestInfoModal = false;
            } else if ((now - Date.parse(lastShown)) < MODAL_SHOW_INTERVAL_MS) {
                //don't show modal if already shown recently
                //(an unparseable value yields NaN, the comparison is false and the modal is shown)
                console.log('Not showing info modal, already shown on/at', lastShown);
                showTestInfoModal = false;
            }
        }

        if (showTestInfoModal) {
            const modal = new bootstrap.Modal(MODAL_ID);
            modal.show();
            if (storage) {
                try {
                    // Store an ISO 8601 string rather than relying on implicit Date-to-string
                    // coercion; values stored in the previous format are still accepted by Date.parse.
                    storage.setItem(STORAGE_PROP, now.toISOString());
                } catch (e) {
                    // Best effort (e.g. quota exceeded): the notice will simply be shown again
                    console.warn('Could not persist info modal state', e);
                }
            }
        }
    });
</script>


    </head>

    <body>
        <div class="container-xl">

            <!-- Primary site navigation; labelled so it can be told apart from the breadcrumb navigation landmark -->
            <nav class="navbar navbar-expand-lg bg-body-tertiary" aria-label="Main">
                <div class="container-fluid">
                    <a class="navbar-brand" href="/">CLARIN Tool Portal <span class="fs-6 text-danger">prototype</span></a>
                    <!-- Toggler for the collapsible menu below (data-bs-target refers to its id) -->
                    <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbarSupportedContent" aria-controls="navbarSupportedContent" aria-expanded="false" aria-label="Toggle navigation">
                        <span class="navbar-toggler-icon"></span>
                    </button>
                    <div class="collapse navbar-collapse" id="navbarSupportedContent">
                        <ul class="navbar-nav me-auto mb-2 mb-lg-0">
                            <li class="nav-item">
                                <a class="nav-link active"
                                   aria-current="page"
                                   href="/search">Search</a>
                            </li>
                            <!--                        <li th:replace="~{::top-navigation-item('contributors','/contributors',${current})}">
                                                        [Contributors]
                                                    </li>-->
                            <li class="nav-item">
                                <a class="nav-link"
                                   href="/help">Help</a>
                            </li>
                        </ul>
                    </div>
                </div>
            </nav>

            <main>


                <div class="mt-3">
                    <!-- Site search: submits the query as the "q" parameter to /search -->
                    <form action="/search" method="get" role="search">
                        <div class="d-flex">
                            <div class="ms-auto w-50 p-2">
                                <!-- No visible label in this layout, so the accessible name is given via aria-label -->
                                <input type="search" class="form-control"
                                       name="q" value="" aria-label="Search query" />
                            </div>
                            <div class="p-2">
                                <input type="submit" class="btn btn-primary"
                                       value="Search" />
                            </div>
                        </div>
                    </form>
                </div>

                <!-- Breadcrumb trail: Home / Search (link carries the q and fq query parameters) / current record -->
                <nav aria-label="breadcrumb">
                    <ol class="breadcrumb">
                        <li class="breadcrumb-item">
                            <a href="/">Home</a>
                        </li>
                        <li class="breadcrumb-item">
                            <a href="/search?q=&amp;fq=dataProvider:CSD%20Tools">Search</a>
                        </li>
                        <li aria-current="page" class="breadcrumb-item active">Record</li>
                    </ol>
                </nav>

                <div class="container-md">
                    <!-- Record header row: title in the wide column; the narrow column holds an empty container on this page -->
                    <div class="row mt-md-2">
                        <div class="col-md-8"><h1>Corpus Studio Web</h1></div>
                        <div class="col-md-4">
                            <div class="mt-2 mb-2">
                            </div>
                        </div>
                    </div>

                    <div class="row">
                        <div class="col-md-8">

                            <div>

        <!--
            Record tabs. The links are htmx-boosted: each one requests its href via AJAX,
            takes the element named by hx-select from the response and swaps it into
            #recordTabsContent (innerHTML, without scrolling). hx-select-oob additionally
            replaces this tab bar with the one from the response, which is how the
            "active" tab is updated.
        -->
        <ul id="mainContentTabsNav" class="nav nav-underline border-bottom"
            hx-boost="true"
            hx-target="#recordTabsContent"
            hx-swap="innerHTML show:none">

            <li class="nav-item">
                <a class="nav-link active"
                   hx-select-oob="#mainContentTabsNav"
                   aria-current="page"
                   href="/records/CSD_32_Tools_47_CorpusStudio.cmdi.xml"
                   hx-select="#recordOverview">Overview</a>
            </li>

            <li class="nav-item">
                <a class="nav-link"
                   hx-select-oob="#mainContentTabsNav"
                   href="/records/CSD_32_Tools_47_CorpusStudio.cmdi.xml/metadata"
                   hx-select="#recordAllMetadata">Detailed metadata</a>
            </li>

            <li class="nav-item">
                <a class="nav-link"
                   hx-select-oob="#mainContentTabsNav"
                   href="/records/CSD_32_Tools_47_CorpusStudio.cmdi.xml/links"
                   hx-select="#recordLinks">Links</a>
            </li>

        </ul>

        <div id="recordTabsContent" class="pt-2">

            

            

            <div>
                <div class="pt-2" id="recordOverview">
                    <!--
                        Record description. The source text consists of titled sections, paragraphs
                        and a feature list separated by line breaks; inside a single <p> those line
                        breaks collapse and everything renders as one run-on paragraph, so the
                        structure is expressed in markup here. The wording is unchanged.
                    -->
                    <div class="mb-2">
                        <h2 class="h5">Summary</h2>
                        <p>CorpusStudio is a web application that facilitates in-depth quantitative syntactic research for linguists.</p>

                        <h2 class="h5">Background</h2>
                        <p>CorpusStudio is a web application that facilitates in-depth quantitative syntactic research for linguists. It does so by supporting researchers in writing queries that operate on syntactically parsed text corpora in a number of major xml formats. Queries that belong together are kept in xml documents that are called ‘Corpus Research Projects’ (CRPs). These documents contain the queries, the order in which they are to be executed, meta-information about the queries and the project as a whole, as well as a specification of the input used for the project. The use of CRPs helps improve the replicability of corpus research.</p>

                        <h2 class="h5">Access</h2>
                        <p>Any CLARIN-NL user can access the CorpusStudio web application and make use of the &#39;standard&#39; corpora. New users must provide a login name and password, after which they can make use of the application.</p>

                        <h2 class="h5">Adaptable</h2>
                        <p>The CorpusStudio code is open-source. Users can take the code, adapt it and use it for their own purposes. Users can also take the code from GitHub as it is, but build their own server in order to run the application on their own text-corpora. User documentation and an API are available (see below). The current version of CorpusStudio supports xml text corpora in the FoLiA and Psdx formats. Extensions to other xml formats are possible.</p>
                        <p>CrpxProcessor provides the basic functionality and is on github on <a href="https://github.com/ErwinKomen/CrpxProcessor">https://github.com/ErwinKomen/CrpxProcessor</a>. CrppServer takes care of /crpp and uses CrpxProcessor. It is on GitHub on <a href="https://github.com/ErwinKomen/CrppServer">https://github.com/ErwinKomen/CrppServer</a>. CrpStudio is on <a href="https://github.com/ErwinKomen/CrpStudio">https://github.com/ErwinKomen/CrpStudio</a>, takes care of /crpstudio and uses CrpxProcessor.</p>

                        <h2 class="h5">Main features</h2>
                        <ul>
                            <li>Keep all important aspects of a research project in one file</li>
                            <li>Define one or more search queries in a hierarchy</li>
                            <li>Uses w3c developed Xquery and Xpath</li>
                            <li>Integrated CorpusStudio-specific Xquery functions</li>
                            <li>User-definable functions and variables</li>
                            <li>Create corpus result databases with user-definable features accompanying each hit</li>
                            <li>Divide the output into calculatable categories</li>
                            <li>Divide the results into meta-data-dependent groups</li>
                            <li>Parallel processing yields a speed-up of a factor 20-100 compared to the Windows version</li>
                            <li>Compatibility with the Windows programs &quot;Cesax&quot; and &quot;CorpusStudio&quot;</li>
                        </ul>

                        <h2 class="h5">Limitations and future developments</h2>
                        <p>Current limitations to the program include: working with result database, restricted login system, no document view, grouping is restricted to system-defined groups, no query or project wizard. Although the CLARIN-NL project has stopped in December 2015, every effort will be undertaken to make sure that a number of essential features are going to be added.</p>
                    </div>
                    <!-- Bibliographic references, one block per publication -->
                    <div class="mb-2">
                        <p>Komen, E. R. 2017. Beyond Counting Syntactic Hits. In: Odijk, J and van Hessen, A. (eds.) CLARIN in the Low Countries, Pp. 259–268. London: Ubiquity Press. DOI: <a href="https://doi.org/10.5334/bbi.21">https://doi.org/10.5334/bbi.21</a>. License: CC-BY 4.0</p>
                    </div>
                    <div class="mb-2">
                        <p>Komen, Erwin R. 2011. Coreferenced corpora for information structure research. In Outposts of Historical Corpus Linguistics: From the Helsinki Corpus to a Proliferation of Resources. (Studies in Variation, Contacts and Change in English 10) Jukka Tyrkkö, Terttu Nevalainen, Matti Rissanen &amp; Matti Kilpiö (eds). Helsinki, Finland: Research Unit for Variation, Contacts, and Change in English.</p>
                    </div>
                    <div class="mb-2">
                        <p>Komen, Erwin R. 2013. Finding focus: a study of the historical development of focus in English. Utrecht: LOT.</p>
                    </div>
                    <div class="mb-2">
                        <p>Komen, Erwin R. 2013. Corpus databases with feature pre-calculation. In Proceedings of the twelfth workshop on treebanks and linguistic theories (TLT12). Sandra Kübler, Petya Osenova &amp; Martin Volk (eds), 85-96. Sofia, Bulgaria: The institute of information and communication technologies, Bulgarian academy of sciences.</p>
                    </div>
                </div>
            </div>
        </div>
    </div>

                        </div>
                        <div class="col-md-4">

                            <div class="me-2">
                                <!-- Empty container on this page (no content rendered for this record) -->
                                <div class="mb-2">
                                    
                                </div>
                                <div class="mb-2">
                                    <!-- Real heading instead of bold text followed by a line break, matching the "Resources:" heading in this sidebar -->
                                    <h2 class="h5">Organisation:</h2>
                                    <ul class="list-group list-group-flush">
                                        <li class="list-group-item">Utrecht University</li>
                                        <li class="list-group-item">KU Leuven</li>
                                    </ul>
                                </div>
                                <!-- Empty container on this page (no content rendered for this record) -->
                                <div class="mb-2">
                                    
                                </div>
                            </div>

                            <!-- Resources attached to the record, one card per resource -->
                            <div class="mt-2 mb-2">
                                <h2 class="h5">Resources:</h2>
                                <div class="card mb-2">
                                    <div class="card-body">
                                        <h3 class="h5 card-title">Resource</h3>
                                        <!-- Media type of the resource -->
                                        <div class="h6 card-subtitle mb-2 text-body-secondary">text/csv</div>
                                        
                                        <div>
                                            <a class="btn btn-outline-secondary btn-sm" href="http://hdl.handle.net/21.11114/COLL-0000-000B-C287-1">
                                                <!-- Decorative icon: hidden from assistive technology, the text "Access" names the link -->
                                                <i class="fa-solid fa-cloud-arrow-down" aria-hidden="true"></i>
                                                Access
                                            </a>
                                        </div>
                                    </div>
                                </div>
                            </div>
                        </div>
                    </div>
                </div>
            </main>

            
            <!-- Page footer: three columns on medium and wider screens, stacked on small ones -->
            <footer class="row row-cols-1 row-cols-md-3 py-4 my-5 text-bg-light">
                <!-- About link and version label -->
                <div class="col mb-3">
                    <p class="text-body-secondary"><a href="/help">About</a></p>
                    <p class="text-body-secondary">vdevelop</p>
                </div>
                <!-- Provider credit and build details -->
                <div class="col mb-3 text-md-center">
                    <p>Service provided by <a href="https://www.clarin.eu">CLARIN</a></p>
                    <p class="text-body-secondary">
                        <span class="text-light footer-hidden-info">built: 2026-05-11T09:06:08Z; revision: 22efec9</span>
                    </p>
                </div>
                <!-- Contact address -->
                <div class="col mb-3 text-md-end">
                    <p><a href="mailto:toolportal@clarin.eu">Contact</a></p>
                </div>
            </footer>
            

<!--
  Session recording notice, a Bootstrap modal.
  aria-labelledby gives the dialog an accessible name (its title); aria-hidden keeps
  the closed dialog out of the accessibility tree until it is shown.
-->
<div id="testInfoModal" class="modal" tabindex="-1" aria-labelledby="testInfoModalLabel" aria-hidden="true">
  <div class="modal-dialog">
    <div class="modal-content">
      <div class="modal-header">
        <h5 id="testInfoModalLabel" class="modal-title">Session recording</h5>
      </div>
      <div class="modal-body">
        <p>
            The version of the Tool Portal that you are currently using
            is <strong>recording the behaviour of its user for testing purposes.</strong>
            By pressing "Continue" below, you agree to the recording of your
            actions while using this site. If you do not wish to agree to this,
            please navigate away from this site.
        </p>
      </div>
      <div class="modal-footer">
        <!-- "Continue" only dismisses the dialog; "Leave" navigates away from the site -->
        <button type="button" class="btn btn-primary" data-bs-dismiss="modal">Continue</button>
        <a class="btn btn-secondary" href="https://www.clarin.eu">Leave</a>
      </div>
    </div>
  </div>
</div>


        

        </div>
    </body>
</html>
