<?xml version="1.0" encoding="UTF-8"?>
<!--
  DataCite (kernel-4 namespace, 4.1 schema location) metadata record for the
  "PrevDistro" dataset.

  Formatting note: only element-only containers are indented. Leaf elements
  that carry text are kept on a single line so that no indentation whitespace
  leaks into their values; the one exception is the first abstract, whose
  embedded line break is part of the original text and is preserved as-is.
-->
<resource xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xmlns="http://datacite.org/schema/kernel-4"
          xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.1/metadata.xsd">
  <identifier identifierType="Handle">21.15109/CONCORDA/XTVX3U</identifier>
  <creators>
    <creator>
      <creatorName nameType="Personal">Kalivoda, Ágnes</creatorName>
      <givenName>Ágnes</givenName>
      <familyName>Kalivoda</familyName>
      <nameIdentifier nameIdentifierScheme="ORCID">0000-0003-2520-5523</nameIdentifier>
      <affiliation>Nyelvtudományi Kutatóközpont</affiliation>
    </creator>
  </creators>
  <titles>
    <title>PrevDistro</title>
    <title titleType="Subtitle">Preverb Distributions</title>
  </titles>
  <publisher>ARP</publisher>
  <publicationYear>2021</publicationYear>
  <subjects>
    <subject>Arts and Humanities</subject>
    <subject>linguistics</subject>
    <subject>Hungarian language</subject>
    <subject>preverb constructions</subject>
  </subjects>
  <contributors>
    <contributor contributorType="ContactPerson">
      <contributorName nameType="Personal">Kalivoda, Ágnes</contributorName>
      <givenName>Ágnes</givenName>
      <familyName>Kalivoda</familyName>
      <affiliation>Nyelvtudományi Kutatóközpont</affiliation>
    </contributor>
  </contributors>
  <dates>
    <date dateType="Submitted">2021-06-21</date>
    <date dateType="Updated">2025-11-24</date>
  </dates>
  <resourceType resourceTypeGeneral="Dataset">corpus data</resourceType>
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="DOI">10.5158/ARP/XTVX3U</alternateIdentifier>
  </alternateIdentifiers>
  <sizes>
    <size>11463972539</size>
  </sizes>
  <formats>
    <format>text/tsv</format>
  </formats>
  <version>2.1</version>
  <rightsList>
    <rights rightsURI="info:eu-repo/semantics/openAccess"/>
    <!-- NOTE(review): empty rights entry kept from the original record; presumably a
         placeholder for a licence statement that was never filled in. Confirm and
         either populate or drop it. -->
    <rights/>
  </rightsList>
  <!-- NOTE(review): the abstract is split across several Abstract descriptions (one per
       column of the dataset). Kept as-is to avoid altering the exported metadata. -->
  <descriptions>
    <description descriptionType="Abstract">PrevDistro (Preverb Distributions) is an open-source dataset containing 41.5 million corpus occurrences of 49 preverb-verb construction types. 
It consists of 10 columns which are as follows:</description>
    <description descriptionType="Abstract">1st: ID</description>
    <description descriptionType="Abstract">2nd: construction type</description>
    <description descriptionType="Abstract">3rd: construction subtype</description>
    <description descriptionType="Abstract">4th: preverb position</description>
    <description descriptionType="Abstract">5th: preverb</description>
    <description descriptionType="Abstract">6th: verb lemma</description>
    <description descriptionType="Abstract">7th: intervening words (as lemmas)</description>
    <description descriptionType="Abstract">8th: actual form</description>
    <description descriptionType="Abstract">9th: document ID</description>
    <description descriptionType="Abstract">10th: actual sentence from the Hungarian Gigaword Corpus, the actual form (KWIC) stands between &lt; ... &gt;</description>
  </descriptions>
  <!-- NOTE(review): empty container kept from the original record; no geolocation is given. -->
  <geoLocations/>
</resource>