## Recommended corpus configuration file for use with Sketch Engine.
## Before use, fill in the path to the corpus in the PATH, VERTICAL and WSDEF
## fields (each currently holds the placeholder "FILL WITH PATH TO CORPUS").
##
## Layout: one directive per line. Comments are kept on their own lines so
## that no directive can end up on the same line as a comment and be ignored.

# ---- Corpus-level settings ----
DOCSTRUCTURE "doc"
ENCODING "UTF-8"
LANGUAGE "Sanskrit (romanised)"
LPOSLIST ""
NAME "Newton_Segmented_Sanskrit"
NOLETTERCASE "1"
PATH "FILL WITH PATH TO CORPUS"
TAGSETDOC ""
# The leading "|" presumably makes VERTICAL a command whose output is read as
# the vertical text -- confirm against the registry documentation.
VERTICAL "| ca_getvertical 'FILL WITH PATH TO CORPUS' 'doc'"
WPOSLIST ""

# ---- Positional attributes ----
# "word" is declared with no options.
ATTRIBUTE "word" {
}

# "lc" is a dynamic attribute computed from "word" by the internal
# utf8lowercase function (see DYNAMIC / DYNLIB / FROMATTR below).
ATTRIBUTE "lc" {
    ARG1 "C"
    DYNAMIC "utf8lowercase"
    DYNLIB "internal"
    DYNTYPE "index"
    FROMATTR "word"
    FUNTYPE "s"
    LABEL "word (lowercase)"
    TRANSQUERY "yes"
}

# ---- Structures ----
# Every structure attribute below shares the same settings (DYNTYPE, ENCODING,
# LOCALE, MULTISEP, MULTIVALUE, TYPE); only doc.id adds LABEL and UNIQUE.

# Structure "s" with a single attribute "number".
STRUCTURE "s" {
    DEFAULTLOCALE "C"
    ENCODING "UTF-8"
    LANGUAGE ""
    NESTED ""
    ATTRIBUTE "number" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
}

# Structure "page" with a single attribute "number".
STRUCTURE "page" {
    DEFAULTLOCALE "C"
    ENCODING "UTF-8"
    LANGUAGE ""
    NESTED ""
    ATTRIBUTE "number" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
}

# Structure "doc" is the one named by DOCSTRUCTURE above; it carries the
# per-document metadata attributes.
STRUCTURE "doc" {
    DEFAULTLOCALE "C"
    ENCODING "UTF-8"
    LANGUAGE ""
    NESTED ""
    ATTRIBUTE "id" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LABEL "File ID"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
        UNIQUE "1"
    }
    ATTRIBUTE "title" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "genre" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "author" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "tradition" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "discourse" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "period" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
    ATTRIBUTE "religion" {
        DYNTYPE "index"
        ENCODING "UTF-8"
        LOCALE "C"
        MULTISEP ","
        MULTIVALUE "n"
        TYPE "MD_MI"
    }
}

# ---- Word sketch / terminology settings ----
# WSDEF still holds the placeholder and must be filled in (see header).
WSBASE ""
WSTHES ""
WSMINHITS ""
WSDEF "FILL WITH PATH TO CORPUS"
TERMDEF ""
TERMBASE "none"