diff --git a/buhd/bku-details.html b/buhd/bku-details.html new file mode 100644 index 000000000..99d0f6864 --- /dev/null +++ b/buhd/bku-details.html @@ -0,0 +1,500 @@ +/* + + + + + + + + +*/ + + + + + +var charDetails = { + + +// MAIN BLOCK + +// Use _tools/generate_details_page_stubs.html to generate stubs to go here + +'\u{1740}': ` +

+

ʔa independent vowel.

+

ᝀᝊ

+

ᝀᝊᝓᝑ

+`, + + + + + +'\u{1741}': ` +

+

ʔi independent vowel.

+

ᝁᝇᝓ

+

ᝁᝌ

+ +

ʔe independent vowel.

+

+

+`, + + + + + +'\u{1742}': ` +

+

ʔo independent vowel.

+

ᝄᝓᝂ

+ +

ʔu independent vowel.

+

ᝂᝇᝓ

+

+`, + + + + + +'\u{1743}': ` +

+

k consonant with inherent vowel a.

+

ᝃᝏ

+

ᝃᝓᝃᝓ

+

+ +

x is possible when word-medial before a vowel.

+

ᝃᝃᝒᝆ

+ +`, + + + + + +'\u{1744}': ` +

+

ɡ consonant with inherent vowel a.

+

ᝄᝉ

+

ᝄᝓᝂ

+

+ +

ɣ is possible when word-medial before a vowel.

+

ᝀᝄᝓ

+ +`, + + + + + +'\u{1745}': ` +

+

ŋ consonant with inherent vowel a.

+

ᝅᝅ

+

ᝅᝒfo

+

+`, + + + + + +'\u{1746}': ` +

+

t consonant with inherent vowel a.

+

ᝆᝊᝓ

+

ᝎᝓᝆᝓ

+

+`, + + + + + +'\u{1747}': ` +

+

d consonant with inherent vowel a.

+

ᝇᝄ

+

ᝇᝓᝏ

+

+`, + + + + + +'\u{1748}': ` +

+

n consonant with inherent vowel a.

+

ᝈᝋᝓ

+

ᝈᝓᝋᝍᝓ

+

+`, + + + + + +'\u{1749}': ` +

+

p consonant with inherent vowel a. In onsets it generally only occurs in loan wordsbm.

+

ᝉᝃᝓ

+

ᝊᝉ

+

+ +

f (?) Evidence needed IPA transcriptions of Buhid words by Barhammb show frequent use of f. Taking the lead from the representation of this sound by p in the Latin orthography and from its representation in the Baybayin script, it is assumed here that the Buhid letter to use for that sound is this one.

+

ᝉᝉ

+

ᝅᝒᝉᝓ

+

+ +`, + + + + + +'\u{174A}': ` +

+

b consonant with inherent vowel a.

+

ᝊᝄᝓ

+

ᝊᝓᝂ

+

+`, + + + + + +'\u{174B}': ` +

+

m consonant with inherent vowel a.

+

ᝋᝆᝒ

+

ᝋᝒᝊᝓᝎᝓ

+

ᝋᝓᝌᝓ

+`, + + + + + +'\u{174C}': ` +

+

j consonant with inherent vowel a.

+

ᝌᝊ

+

+

ᝐᝒᝌᝓ

+`, + + + + + +'\u{174D}': ` +

+

r consonant with inherent vowel a.

+

ᝍᝒᝍᝓ

+

ᝈᝓᝋᝍᝓ

+

+`, + + + + + +'\u{174E}': ` +

+

l consonant with inherent vowel a.

+

ᝎᝊᝓ

+

ᝈᝎᝒ

+

ᝎᝓᝆᝓ

+`, + + + + + +'\u{174F}': ` +

+

w consonant with inherent vowel a.

+

ᝏᝐ

+

ᝄᝎᝏᝒ

+

+`, + + + + + +'\u{1750}': ` +

+

s consonant with inherent vowel a.

+

ᝐᝊ

+

ᝐᝒᝑᝒ

+

ᝐᝓᝎ

+`, + + + + + +'\u{1751}': ` +

+

h consonant with inherent vowel a.

+

ᝑᝆ

+

ᝐᝒᝑᝒ

+

ᝑᝓᝋᝒ

+`, + + + + + +'\u{1752}': ` +

+

i e dependent vowel.

+

ᝐᝒᝆ

+

ᝍᝒᝍᝓ

+

ᝈᝎᝒ

+

ᝋᝋᝒᝄᝓ

+ +

Nominally, this is a horizontal line that looks the same as the dependent vowel o u but appears above the base. In fact, although it always appears higher than the latter, the way it connects with the base varies from consonant to consonant.

+`, + + + + + +'\u{1753}': ` +

+

o u dependent vowel.

+

ᝊᝓ

+

ᝍᝒᝍᝓ

+

ᝎᝓᝆᝓ

+

ᝐᝓᝑᝓ

+ +

Nominally, this is a horizontal line that looks the same as the dependent vowel i e but appears below the base. In fact, although it always appears lower than the latter, the way it connects with the base varies from consonant to consonant.

+`, + + + + + + + + + + + + +// HANUNOO PUNCTUATION + + +'\u{1735}': ` +

+ +

Used as a comma, or as a verse splitter in poetry.

+

See also 1736.

+`, + + + + + +'\u{1736}': ` +

+ +

Used as a full stop, or paragraph stop.

+

See also 1735.

+`, + + + + + + + + + + + + + +// COMMON PUNCTUATION + + +// § +'\u{00A7}': ` +

§

+`, + + + + +// « +'\u{00AB}': ` +

«

+`, + + + + +// » +'\u{00BB}': ` +

»

+`, + + + + +// danda +'\u{0964}': ` +

+`, + + + + +// double danda +'\u{0965}': ` +

+`, + + + + +// – +'\u{2010}': ` +

+`, + + + + +// – +'\u{2013}': ` +

+`, + + + + +// — +'\u{2014}': ` +

+`, + + + + +// '.. +'\u{2018}': ` +

+`, + + + + +// ..' +'\u{2019}': ` +

+`, + + + + +// ".. +'\u{201C}': ` +

+`, + + + + +// .." +'\u{201D}': ` +

+`, + + + + +// ! +'\u{0021}': ` +

!

+`, + + + + +// … +'\u{2026}': ` +

+`, + + + + +// ( +'\u{0028}': ` +

(

+`, + + + + +// ) +'\u{0029}': ` +

)

+`, + + + + +// , +'\u{002C}': ` +

,

+`, + + + + +// . +'\u{002E}': ` +

.

+`, + + + + +// : +'\u{003A}': ` +

:

+`, + + + + +// ; +'\u{003B}': ` +

;

+`, + + + + +// ? +'\u{003F}': ` +

?

+`, + + + + + +} +// \ No newline at end of file diff --git a/buhd/bku-examples.js b/buhd/bku-examples.js new file mode 100644 index 000000000..f6b370f5b --- /dev/null +++ b/buhd/bku-examples.js @@ -0,0 +1,157 @@ +/* +native | meaning | IPA① | transcription | other transcriptions② | notes | wiktionary③ + + +① separate each text unit (consonant+combining_mark(s)) with §, separate phonetic syllables with . + use ‹ and › for a sound that spans 2 text units + use – for a text unit that doesn't produce sound + syllable boundary markers go inside previous unit, and emphasis markers begin emphasised unit + +② the previous transcription field is always Latin. + if there is another key orthography (eg. Mongolian cyrillic) it goes here. + vowelled/unvowelled alternatives also go here + +③ if Wiktionary spells the word differently, add the spelling here +*/ + + + + + +autoExpandExamples.bku = ` + +@ The Phonemes of the Buhid (Mangyan) Language of Eastern Mindoro, Philippines https://archive.org/details/rosettaproject_bku_phon-1/mode/2up + +ᝉᝃᝓ|nail|pa§ko|páko +ᝇᝎᝓᝑ|palm (hand)|da§lu§ha§p|dalúhap +ᝃᝐ|beside|ka§p§sa§n|kapsán +ᝊᝄᝓ|new|ba§ɣo|bágo +ᝊᝊ|wooden bar|bak§baŋ|bakbáŋ +ᝎᝊᝓ|now|la§bon|labón +ᝎᝑᝓ|skin, bark|lʌ§hob|lʌhób +ᝆᝄ|nest (domestic fowl)|ta§gan|tagán +ᝇᝆ|level|ˈdʌ§tʌg|dʌ́tʌg +ᝇᝇ|old|ˈdʌn§dan|dʌ́ndan +ᝃᝓᝃᝓ|hoe|ˈkud§kod|kúdkod +ᝆᝌ|forearm|tak§ˈjaj|takyáy +ᝃᝎᝒᝋᝓ|startle|ka§ˈli§mo|kalímo +ᝎᝓᝆᝓ|mud; ripe|ˈlu§tok|lútok +ᝄᝎᝏᝒ|scythe|ɡa§ˈla§wit|galáwit +ᝂᝇᝓ|feelings|ˈʔuɡ§doɡ|ʔúgdog +ᝊᝓᝂ|hate|bu§ˈʔot|buʔót +ᝄᝓᝂ|well|ɡubˈʔon|gubʔón +ᝋᝎᝐᝒ|white|mʌ§ʔlʌk§siʔ|mʌlʌ́ksiʔ +fᝎ|soul|ˈfa§lad|fálad +ᝅᝒᝉᝓ|tooth|ˈŋi§fon|nífon +ᝐf|stream|ˈsa§fa|sáfa +ᝑᝆ|to come|ˈhas§taj|hástay +ᝄᝋ|hand/thread|ga§ˈmʌt/ˈɡʌ§mʌs|gamʌ́t/gʌ́mʌs +ᝊᝓᝑᝄᝓ|proud|bu§ˈha§ɣod|búhagod +ᝋᝋᝒᝄᝓ|bathe|ma§ˈme§ɣus|mamégus +ᝈᝓᝋᝍᝓ|tomorrow|nu§ma§ˈrum|numarúm +ᝈᝊᝆ|watch|nʌ§bán§taj|nʌbántay +ᝋᝏᝈ|dwell|man§ˈwaj§nan|manwáynan +ᝅᝅ|chew|ˈŋas§ŋas|ŋásŋas +ᝋᝂ|eat|ˈmaŋ§on|máŋon||not entirely sure of segmentation +ᝎᝒᝎᝋᝓ|woman's 
garment|li§ˈlaɡ§mon|lilágmon +ᝍᝒᝍᝓ|write|ˈri§rok|rírok +ᝏᝐ|axe/for|wa§ˈsaj/wa§ˈsaɡ|wasáy/waság +ᝇᝓᝏ|two|ˈdu§waʔ|dúwaʔ +ᝄᝓᝈ|flood|ˈɡu§naw|gúnaw +ᝌfo|supper|ˈja§fon|yáfon +ᝀᝌᝓfa|centipede|ʔal§ˈjo§fan|ʔalyófan +ᝀᝊᝓᝑ|white|ʔa§ˈbu§haj|ʔabúhay +ᝐᝒᝆ|dirty|ˈsi§tʌm|sítʌm +ᝐᝒᝑᝒ|heel|si§ˈhil|sihíl +ᝐᝓᝎ|chin|ˈsu§lan|súlan +ᝀᝄᝓ|short|ʔaˈɣud|ʔagúd +ᝐᝒᝌᝓ|bamboo floor slats|ˈse§jug|séyug +ᝈᝎᝒ|hold|nʌ§ˈleɡ|nʌlég +ᝀᝊᝐ|deep|ʔʌ§bʌ§ˈsʌd|ʔʌbʌsʌ́d +ᝊᝓᝑᝒ|Buhid/lesson|bu§hid§/ˈbohin|buhid/bóhin +ᝐᝓᝑᝓ|roof|ˈso§hob|sóhob +ᝇᝄᝓ|needle|ˈda§ɡom|dágom +ᝄᝉ|kapok|ˈɡa§pas|gápas +ᝇᝄ|ground|ˈda§ɡa|dága +ᝁᝉ|girl friend|ʔi§ˈpʌɡ|ʔipʌ́g +ᝈᝎ|see|nʌ§ˈlʌɡ|nʌlʌ́g +ᝀᝊ|high|ʔa§ˈbat§/ʔʌbát|abát +ᝀᝎ|fence|ˈʔa§lad§ʔʌ́lʌd|ʔálad +ᝎᝓᝈ|calf (leg)|ˈluk§nan|lúknan +ᝊᝓ|hair|bok|bok +ᝉᝉ|cooked rice|ˈfa§fa|fáfa +ᝎᝓfo|sad|ˈlu§foɡ|lúfog +ᝄfa|thought|ˈɡaj§fan|gáyfan +ᝁᝌ|not yet|ˈʔid§ya|ʔídya +ᝊᝉ|uncle|ˈba§pa|bápa +ᝆᝌᝓ|counsel|ta§ˈjo|tayó +ᝃᝏ|on account of|ˈka§wa|káwa +fiᝌ|good|ˈfi§ja|fíya +ᝑᝓᝋᝒ|beard|ˈhu§mi|húmi +ᝋfa|lazy|ma§ˈfaŋ|mafáŋ +ᝈᝋᝓ|mosquito|na§ˈmok|namók +ᝅᝌ|name|ˈŋa§jan|ŋáyan +ᝌᝊ|breakfast|ˈya§bas|yábas +ᝋᝌ|heavy|mab§ˈjat|mabyát +ᝑᝓᝃᝓ|dig|ˈhud§kod|húdkod +ᝋᝆᝌᝓ|sharp|mʌ§ta§ˈjom|mʌtayóm +ᝋᝒᝊᝓᝎᝓ|industrious|mi§ˈbo§lon|mibólon +ᝋᝓᝌᝓ|sincere|ˈmu§joŋ|múyoŋ +ᝐᝊ|enter|ˈsak§baw|sákbaw +ᝋᝌᝏ|clear|ma§ja§waʔ|mayawaʔ +ᝋᝆᝒ|cold (water)|ma§ˈtis|matís +ᝄᝒfu|whistle|ˈgi§fol|gífol +ᝎᝆᝓᝇ|red banana|la§ˈtur§dan|latúrdan +ᝋᝎᝓ|upright|ˈmas§loŋ|másloŋ +ᝑᝐᝒ|there|ˈhʌt§si|hʌ́tsi +ᝊᝎ|house|ˈba§laj|bálay +ᝆᝊᝓ|end|ta§ˈbo|tabó +ᝁᝇᝓ|dog|ˈʔi§do|ʔído +ᝃᝓ|box|kon|kon +ᝆᝓ|knee|tod|tod +ᝃᝃᝒᝆ|but|ka§xi§ˈtaj|kakitáy + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +` + diff --git a/buhd/bku-globals.js b/buhd/bku-globals.js new file mode 100644 index 000000000..5ec992c63 --- /dev/null +++ b/buhd/bku-globals.js @@ -0,0 +1,20 @@ + + +langTag='bku' // BCP47 language tag for this orthography +scriptTag='buhd' // BCP47 script tag for this orthography +notesLangtag='bku' +blockLangtag = 'bku' // same as langTag; used in 
block.html +blockDirection='' // ltr/rtl or '' for ltr; used by block.html + +blockDirectoryName='buhd' // folder name where block file is found, no slash +orthogFilePath='buhd/bku' // path below /scripts, including filename, but no extension, eg. lana/nod +pickerDir='buhd' // directory name for picker, no slash at end +scriptSummaryTableName='bku' // id used for langs record in xx-langdata.js; used to make summary table +charUsageBCP='bku-buhd' // bcp tag to find the orthography in the charuse app; used in makeIndexIntro only +orthogName = 'Buhid' // natural language name for the orthography; used only in makeIndexIntro +languageName = 'Buhid' // natural language name of language; used in various places, esp block +scriptIsIndic = true // true if there are indic syllabic categories; used only in makeIndexIntro + + +defaultSize = '24px' // used by block.html to set size of font, including in font mgt panel +letterClassName = 'bku' // classname for a given orthography in the block page diff --git a/buhd/bku-langdata.js b/buhd/bku-langdata.js new file mode 100755 index 000000000..5d6979342 --- /dev/null +++ b/buhd/bku-langdata.js @@ -0,0 +1,18 @@ +// this should always be updated when app-charuse/langs.js is updated + +var langs = { + +"bku-buhd": { name:"Buhid (Bangon, Batangan, Buhid-Mangyan, Bukil)", local:"ᝊᝓᝑᝒ", localtrans:"(buhid)", +source:"3bd5a62d6d969a796148fc6c805c3eb8ac27e52d", +region:"oce", countries:"Philippines", script:"buhd", speakers:"11600", +letter:"ᝀᝁᝂᝃᝄᝅᝆᝇᝈᝉᝊᝋᝌᝍᝎᝏᝐᝑ", mark:"ᝒᝓ", number:"", punctuation:"᜵᜶", symbol:"", other:"", +orth:`Buhid  `, +also: +["bku | latn | Primary."], +type:"abugida", cs:"no", gpos:"yes", gsub:"yes", cursive:"no", wordsep:"space", baseline:"mid", wrap:"word", hyphenation:"?", direction:"ltr", justification:"?", +vowels:"vs:2 ind:3", +linked:"buhd", fonts:"buhd", font:"'Noto Sans Buhid'", +}, + + +} \ No newline at end of file diff --git a/buhd/bku-translit.js b/buhd/bku-translit.js new file mode 100755 index 
000000000..c7a97f338 --- /dev/null +++ b/buhd/bku-translit.js @@ -0,0 +1,4 @@ + +autoTranslitArray.bku = + +{"\u{1735}":",","\u{1736}":".","\u{1740}":"\u{1EA1}","\u{174A}":"b","\u{1747}":"d","\u{1744}":"g","\u{1751}":"h","\u{1741}":"\u{1ECB}","\u{1752}":"i","\u{1743}":"k","\u{174E}":"l","\u{174B}":"m","\u{1748}":"n","\u{1745}":"\u{14B}","\u{1749}":"p","\u{174D}":"r","\u{1750}":"s","\u{1746}":"t","\u{1742}":"\u{1EE5}","\u{1753}":"u","\u{174F}":"w","\u{174C}":"y"} \ No newline at end of file diff --git a/buhd/bku.css b/buhd/bku.css new file mode 100755 index 000000000..f7810e90c --- /dev/null +++ b/buhd/bku.css @@ -0,0 +1,93 @@ +@font-face { + font-family: 'Noto Sans Buhid WF'; + src: url('../../shared/webfonts/notosansbuhid-regular-webfont.woff2') format('woff2'), + url('../../shared/webfonts/notosansbuhid-regular-webfont.woff') format('woff'); + font-weight: normal; + font-style: normal; + } + +#freeText { + font-size: 44px; + font-family: "Noto Sans Buhid WF"; + text-align: start; + line-height: 2; + } + +@media print { #freeText { font-size: 18px; } } + +[lang=tmp] { font-family: "Noto Sans Buhid WF"; font-size: 140%; } + + +/* optional +.listItem[lang] { + font-size: 300%; + } +.codepoint span[lang=nod], .codepoint bdi[lang=nod] { + color: black; + font-size: 3rem; + } +*/ + + + + + + + +.useBlockExamples .charExample .ex { + font-size:200%; + line-height: 1; + } +.useBlockExamples .charExample.inline .ex { + font-size: 200%; + } + +.map .charExample .ex { + font-size: 1.6rem; +} + + +.vowelSignExample bdi { + font-size:300%; + line-height:.6; + } + + + +.mapItem { + text-align: start; + } +.mapItem.initial { + border-bottom: 0; + } +.mapItem .col1, .mapItem .col2 { + margin-inline-end: 1rem; + } +.mapItem .ipa { + hyphens: none; + } +#vowel_mappings .mapItem div.col3 { + flex: 1; + } +#vowel_mappings .mapItem div.col2 { + flex: 1; + } +#vowel_mappings .mapItem div.col1 { + flex: 1; + } +#consonant_mappings .mapItem div.col3 { + flex: 3; + } +#consonant_mappings 
.mapItem div.col2 { + flex: 1; + text-align: end; + font-size: 2em; + } +.mapItem example { + line-height: 3; + } +.shaping bdi { + margin-inline: .5rem; + font-size: 2rem; + } + diff --git a/buhd/bku.html b/buhd/bku.html new file mode 100755 index 000000000..873e59686 --- /dev/null +++ b/buhd/bku.html @@ -0,0 +1,1849 @@ + + + + +Buhid orthography notes + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ + + + +

Buhid

+
orthography notes
+ + + + + + + + +

Updated +17 December, 2023 + +

+ + + + + + + +
+

This page brings together basic information about the Buhid script and its use for the Buhid language. It aims to provide a brief, descriptive summary of the modern, printed orthography and typographic features, and to advise how to write Buhid using Unicode.

+ + +
+Citing this document +

Richard Ishida, Buhid Orthography Notes, 17-Dec-2023, https://r12a.github.io/scripts/buhd/bku

+
+ +

Note: Given the difficulty in finding term lists written in the Buhid orthography, the examples cited here were derived manually by applying the rules of the orthography to Latin transcriptions. Buhid is a simple enough script that these should be reliable, except that there is a question around the representation of the consonant f. In this page we represent that sound using (click the name for more information). This tallies with usage for Baybayin.

+ + +

+ +
+ + + + + + + + + + + + + + +
+

Sample

+ +

Select part of this sample text to show a list of characters, with links to more details.
+ +Change size: 44px

+ +
+ +

ᝃᝑᝓ ᝃᝑᝓ ᝃᝓ ᝋᝎᝄᝓ
+ᝃᝊᝓᝌᝓ ᝊᝓᝌᝓ ᝐᝒ ᝂᝎᝓ
+ᝃᝇᝓᝌ ᝇᝓᝌ ᝐᝒ ᝇᝄᝓ᜵
+ᝇᝎᝃ ᝐ ᝉᝍᝓᝋᝒᝌᝓ
+ᝐᝒᝑᝋᝓ ᝃ ᝐ ᝊᝎ ᝊᝃᝓ
+ᝀᝈ ᝂᝋᝊᝓᝓ ᝃ ᝈᝒᝋᝓ᜶

+
+ +

Source: Wikipedia, Buhid urukays from The Mangyans of Mindoro by Violeta B Lopez.

+
+ + + + + + +
+

Usage & history

+ +

The Buhid language is spoken by around 11,000e Mangyans in the island of Mindoro, Philippines.

+ +

The Buhid script is currently endangered, and authorities in the area where it is spoken are trying to encourage its use by the younger generation. One particularly common former use was for writing ambahan, traditional poetry.

+ +

ᝊᝓᝑᝒ

+ +

When the Spaniards arrived in the Philippines in the 1500s they were surprised to find that the inhabitants were largely literate in scripts of which Buhid is one survivor. The scripts have the characteristics of Brahmi-derived scripts, but the pathway that led to this orthography is not clear. It is thought that it may lead via Java and have arrived in the Philippines between the 10th and 14th centuries.me

+ +

For more detailed historical information see Lorenzo Catapang.

+
+ + + + + +
+ +
+ + + + + + + +
+

Basic features

+ +

The Buhid script is an abugida. Consonants carry an inherent vowel which can be modified by appending vowel signs to the consonant. See the table to the right for a brief overview of features for the modern Buhid orthography.

+ +

Buhid text runs left-to-right in horizontal lines, and is unicameral.

+ +

Buhid has 15 consonant letters, but they are only used to indicate syllable onsets. Syllable codas are not written. This can lead to some word ambiguity, and also means that the text doesn't indicate any consonant clusters. ❯ consonants

+ +

The Buhid orthography is an abugida with one inherent vowel, generally pronounced a, but sometimes ʌ. Vowels are written using only 2 vowel signs (for 4 sounds), and no consonants. ❯ vowels

+ +

Buhid has 3 independent vowels, used for vowels that are preceded by a glottal stop. These may occur word-initially or word-medially. ❯ standalone

+
+ + + + + + + + + +
+

Character index

+ + + + +
+ + + + + +
+

Letters

+
+Show + + +
+

Consonants

+
ᝃ␣ᝄ␣ᝅ␣ᝆ␣ᝇ␣ᝈ␣ᝉ␣ᝊ␣ᝋ␣ᝌ␣ᝍ␣ᝎ␣ᝏ␣ᝐ␣ᝑ
+
+ +
+

Vowels

+
ᝀ␣ᝁ␣ᝂ
+
+
+
+ + + +
+

Combining marks

+
+Show + + +
+

Vowels

+
ᝒ␣ᝓ
+
+
+
+ + + + + + + + + + + +
+

Punctuation

+
+Show + +
᜵␣᜶
+
+
+ + + + + + + + + + + + + +
+ + + + + + + +
+
+Items to show in lists +
+
+
+
+
+
+
+ + + + + + + +
+

Phonology

+ +

The following represents the repertoire of the Buhid language.

+

Click on the sounds to reveal locations in this document where they are mentioned.

+

Phones in a lighter colour are non-native or allophones. Source Barham.

+ + + + +
+

Vowel sounds

+ + +
+

Plain vowels

+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + i + u + + + e + o + + + ʌ + ʌ + + + + a + +
+ + +

a and ʌ are sometimes interchangeable.

+
+ + + + + + +
+

Consonant sounds

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
labial dental alveolar palatal velar glottal
stopp bt d  k ɡʔ
fricative f s x ɣh
nasalm n ŋ
approximantw lj 
trill/flap  r
+
+ + + + + + +
+

Tone

+ +

Buhid is not a tonal language.

+
+ + + + + +
+

Structure

+ +

Barhammb reports 2 syllable types:

+
CV | CVC
+ + + +

These are combined into words with the following structures:

+
CVC | CVCV | CVCVC | CVCCVC | CVCCV
+ + +

Barham reportsmb,9 that certain Tagalog words with the structure CVCVC have corresponding words in Buhid with the structure CVC where there is a tendency to lengthen the single vowel, but only in slow speech.

+ +

The following restrictions apply:

+
+
Onset
+
p only appears in loan words. Otherwise all consonants can appear.
+
Nucleus
Includes any vowel.
+
Coda
Can be any consonant except f and h.
+
+ +

Barham (p8) provides additional detail about which consonant sequences can appear in clusters.

+
+
+ + + + + + + +

+ + + + + + + + +

+ +
+

Vowels

+ + +
+

The following features are not found in the Buhid orthography.

+ +
    +
  • No consonants are used to create vowel sounds.
  • +
  • There are no pre-base vowels or circumgraphs, nor are there any multipart vowels.
  • +
  • Vowel length is not marked.
  • +
  • Nasalisation is not a feature of the Buhid language.
  • +
  • Buhid is not a tonal language.
  • +
  • The Buhid orthography has no way to indicate consonants that are not followed by a vowel.
  • +
+
+ + +
+ + + + + + + +
+

Vowel summary

+ +

ⓘ represents the inherent vowel. The left column shows dependent vowels, and the right independent.

+ + + + + + + + + + + + + + + + + +
Simple:
ᝒ␣␣ᝓ
ᝁ␣ ␣ᝂ
ᝒ␣␣ᝓ
ᝁ␣ ␣ᝂ
+ + +

For additional details see vowel_mappings.

+
+ + + + + + + + + + +
+

Inherent vowel

+ +

+ + ka + U+1743 LETTER KA +

+ +

+ +

a following a consonant is not written, but is seen as an inherent part of the consonant letter, so ka is written by simply using the consonant letter.

+
+ + + + + + + + +
+

Combining marks used for vowels

+ +

+ ᝃᝒ + ki + U+1743 LETTER KA + U+1752 VOWEL SIGN I +

+ +

Buhid uses only two combining marks for vowels when it is necessary to override the inherent vowel.

+ +
ᝒ␣ᝓ
+ +

Each vowel sign represents one of 2 sounds. 1752 represents either the sound i or the sound e; 1753 represents either o or u.

+ +

In principle, the glyphs look the same, and the distinction is made by position: i ~ e goes above the base, and o ~ u goes below. However, in practice, although the relative height distinction is always preserved, the way the vowel sign connects with the base varies from consonant to consonant. The differences are significant enough to make it worthwhile to show all possible combinations in the table below.

+ + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
ConsonantNo vowel signWith i/eWith o/u
pᝉᝒᝉᝓ
bᝊᝒᝊᝓ
tᝆᝒᝆᝓ
dᝇᝒᝇᝓ
kᝃᝒᝃᝓ
ɡᝄᝒᝄᝓ
sᝐᝒᝐᝓ
hᝑᝒᝑᝓ
mᝋᝒᝋᝓ
nᝈᝒᝈᝓ
ŋᝅᝒᝅᝓ
wᝏᝒᝏᝓ
rᝍᝒᝍᝓ
lᝎᝒᝎᝓ
jᝌᝒᝌᝓ
+
Placement of vowel signs with Buhid consonants.
+
+ + +
+ + + + + + + +
+

Standalone vowels

+ +

+ + a + U+1740 LETTER A +

+ +

+ +
ᝀ␣ᝁ␣ᝂ
+ +

Vowels at the beginning of a word or following another vowel are actually transcribed in IPA with a preceding glottal stop (ʔ), but they are written using one of 3 independent vowel letters.

+ +

As with the vowel signs, these letters each represent one of two possible sounds. (See the box above.)

+ +

ᝀᝊᝓᝑ

+

ᝁᝇᝓ

+

ᝄᝓᝂ

+
+ + + + + + + + + + + +
+

Vowel sounds to characters

+ + +

This section maps Buhid vowel sounds to common graphemes in the Buhid orthography.

+ +

The left column shows dependent vowels; the right column shows independent vowel letters.

+ +

Sounds listed as 'infrequent' are allophones, or sounds used for foreign words, etc.

+ + + + + + + +
+

Plain vowels

+ +
+
+
i
+
 
+
+

1752

+

ᝐᝒᝆ

+
+
+

1741

+

ᝁᝇᝓ

+
+
+ +
+
u
+
 
+
+

1753

+

ᝎᝓᝆᝓ

+
+
+

1742

+

ᝂᝇᝓ

+
+
+
+
+ + + + + +
+
+
e
+
 
+
+

1752

+

ᝈᝎᝒ

+
+
+

1741

+

+
+
+ +
+
o
+
 
+
+

1753

+

ᝐᝓᝑᝓ

+
+
+

1742

+

ᝄᝓᝂ

+
+
+
+ + + + + +
+
+
a
+
 
+
+

Inherent vowel

+

ᝆᝊᝓ

+
+
+

1740

+

ᝀᝊᝓᝑ

+
+
+ +
+
ʌ
+
 
+
+

Inherent vowel

+

ᝇᝆ

+
+
+

1740

+

ᝀᝊᝐ

+
+
+
+
+ + + + + + + +
+
+ + + + + + + + + + +

+ + +

+ + + +
+

Consonants

+ + +
+

The following features are not found in the Buhid orthography.

+ + +
+ + + + +
+ + + + + + + + + + + + + + +
+

Basic consonants

+ +

Buhid consonants are few and simple. There is no repertoire extension mechanism.

+ +
ᝉ␣ᝊ␣ᝆ␣ᝇ␣ᝃ␣ᝄ
+
ᝐ␣ᝑ
+
ᝋ␣ᝈ␣ᝅ
+
ᝏ␣ᝍ␣ᝎ␣ᝌ
+ + +

may be pronounced x when word-medial and before a vowel; likewise, may be pronounced ɣ.

+ + + +
+

The f phoneme

+ +

The phonetic transcriptions by Barhammb indicate common use of the phoneme f, but no character for that sound exists in the Buhid Unicode block. The Unicode proposal document mentions a possible character for f introduced during a script reform, but doesn't propose anything because it is 'wanting attestation'. Room was left in the block for later additions, if necessary.

+ +

It has been difficult to find evidence of how this sound is written, but Satots mentions that in Philippine Latin orthography f is usually written as p. This page therefore uses 1749 to represent this sound. This needs to be checked against actual usage.

+
+
+ + + + + + + +
+

Onsets

+ +

Buhid syllable onsets are straightforward. They don't involve consonant clusters.

+
+ + + + + + +
+

Finals

+ +

Like some other neighbouring scripts, the syllable codas are not written in the Buhid orthography. This, of course, can lead to a certain amount of ambiguity. Examples:

+ +

ᝄᝋ

+

ᝏᝐ

+
+ + + + + + +
+

Consonant clusters

+ +

+

+ +

Buhid has no conjuncts or other special mechanisms for handling consonant clusters, which normally only occur when a syllable with a coda precedes a syllable with a consonant onset.

+
+ + + + + + + + + + + + + + + +
+

Consonant sounds to characters

+ +

This section maps Buhid consonant sounds to common graphemes in the Buhid orthography.

+ +

Syllable-final consonants are never written. The right-hand column shows the shape alone, combined with vowel sign I, and combined with vowel sign U, respectively.

+ +

Click on a grapheme to find other mentions on this page (links appear at the bottom of the page). Click on the character name to see examples and for detailed descriptions of the character(s) shown.

+ +

Sounds listed as 'infrequent' are allophones, or sounds used for foreign words, etc.

+ + + + +
+

Stops

+
+ +
+
p
+
 
+
+

1749

+

ᝉᝃᝓ

+
+
+

ᝉ ᝉᝒ ᝉᝓ

+
+
+ +
+
b
+
 
+
+

174A

+

ᝊᝄᝓ

+
+
+

ᝊ ᝊᝒ ᝊᝓ

+
+
+ +
+
t
+
 
+
+

1746

+

ᝆᝊᝓ

+
+
+

ᝆ ᝆᝒ ᝆᝓ

+
+
+ +
+
d
+
 
+
+

1747

+

ᝇᝄ

+
+
+

ᝇ ᝇᝒ ᝇᝓ

+
+
+ +
+
k
+
 
+
+

1743

+

ᝃᝏ

+
+
+

ᝃ ᝃᝒ ᝃᝓ

+
+
+ +
+
ɡ
+
 
+
+

1744

+

ᝄᝓᝂ

+
+
+

ᝄ ᝄᝒ ᝄᝓ

+
+
+
+
+ + + + + + +
+

Fricatives

+
+ +
+
f
+
 
+
+

1749 This has to be checked!

+

ᝉᝉ

+
+
+

ᝉ ᝉᝒ ᝉᝓ

+
+
+ +
+
s
+
 
+
+

1750

+

ᝐᝓᝎ

+
+
+

ᝐ ᝐᝒ ᝐᝓ

+
+
+ +
+
x
+
 
+
+

1743 when word-medial and followed by a vowel.

+

ᝃᝃᝒᝆ

+
+
+

ᝃ ᝃᝒ ᝃᝓ

+
+
+ +
+
ɣ
+
 
+
+

1744 when word-medial and followed by a vowel.

+

ᝀᝄᝓ

+
+
+

ᝄ ᝄᝒ ᝄᝓ

+
+
+ +
+
h
+
 
+
+

1751

+

ᝑᝓᝋᝒ

+
+
+

ᝑ ᝑᝒ ᝑᝓ

+
+
+
+
+ + + + + + +
+

Nasals

+
+ +
+
m
+
 
+
+

174B

+

ᝋᝒᝊᝓᝎᝓ

+
+
+

ᝋ ᝋᝒ ᝋᝓ

+
+
+ +
+
n
+
 
+
+

1748

+

ᝈᝓᝋᝍᝓ

+
+
+

ᝈ ᝈᝒ ᝈᝓ

+
+
+ +
+
ŋ
+
 
+
+

1745

+

ᝅᝒᝉᝓ

+
+
+

ᝅ ᝅᝒ ᝅᝓ

+
+
+
+
+ + + + +
+

Other sonorants

+
+ +
+
w
+
 
+
+

174F

+

ᝄᝎᝏᝒ

+
+
+

ᝏ ᝏᝒ ᝏᝓ

+
+
+ +
+
r
+
 
+
+

174D

+

ᝍᝒᝍᝓ

+
+
+

ᝍ ᝍᝒ ᝍᝓ

+
+
+ +
+
l
+
 
+
+

174E

+

ᝎᝓᝆᝓ

+
+
+

ᝎ ᝎᝒ ᝎᝓ

+
+
+ +
+
j
+
 
+
+

174C

+

ᝐᝒᝌᝓ

+
+
+

ᝌ ᝌᝒ ᝌᝓ

+
+
+
+
+
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+

Numbers

+ +

The Buhid Unicode block doesn't have a set of native digits.

+
+ + + + + + + + + +
+

Text direction

+ +

Buhid text runs left to right in horizontal lines.

+ +

Eversonme reports that the writing often runs bottom to top on lines that progress from left to right. However, the letter glyphs are rotated in this case, so this is simply a rotation of the medium, rather than a different writing direction. It makes it easier to fit the writing on bamboo strips.

+ +

Show default bidi_class properties for characters in the Buhid orthography described here.

+
+ + + + + + + + + +

+ + +

+ + + + + + +
+

Glyph shaping & positioning

+ + + +
+

The following features are not found in the Buhid orthography.

+ + +
+ + + + + + + +

This section brings together information about the following topics: +writing styles; +cursive text; +context-based shaping; +context-based positioning; +baselines, line height, etc.; +font styles; +case & other character transforms. +

+ +

You can experiment with examples using the Buhid character app.

+ + + + + + +
+

Context-based shaping & positioning

+ +

Buhid letters don't interact with each other, but the placement of the vowel signs requires context-sensitive placement, and in some cases reshaping of the letter. The various combinations are shown in dependent_vowel_table.

+

Buhid has no multiple combining marks, or other shaping to consider.

+
+ + + + + + + +
+

Letterform slopes, weights, & italics

+

tbd

+ + + +

Since it is very hard to find any printed examples of Buhid text, it is likely that there is no standard approach to the use of oblique and bold forms, if they are used at all. The Noto Buhid font has only a regular face.

+
+
+ + + + + + + + +
+

Graphemes

+ +

+

+ +

Buhid is a simple orthography and typographic units can be easily segmented using grapheme clusters.

+ +

Phrase, sentence, and section delimiters are described in phrase.

+ + + + +
+

Grapheme clusters

+ + +

Base Combining_mark*

+ +

Buhid typographic units consist of a letter or a letter with a single combining mark (one of two vowel signs). Both of these units fit the definition of a grapheme cluster.

+ +

As previously noted, syllable codas are not written in Buhid text, and so the segmentation only captures onsets and the syllable nucleus.

+
+
+
+

Punctuation & inline features

+ + + + +
+

Word boundaries

+

+ +

Words are separated by spaces.

+
+ + + + + + + +
+

Phrase & section boundaries

+ + + + +
᜵␣᜶
+ +

Buhid uses for a short pause, and for a longer or sentence-like pause. It may also be used at the end of a poem.

+ + + + + + + + + + + + +
phrase +
sentence +
+
+ + + + + +
+

Bracketed text

+

tbd

+ +
+ + + + + + +
+

Quotations & citations

+

tbd

+ +
+ + + + + +
+

Emphasis

+

tbd

+
+ + + + + +
+

Abbreviation, ellipsis & repetition

+

tbd

+ + +
+ + + + + +
+

Inline notes & annotations

+

tbd

+
+ + + + + +
+

Other punctuation

+ +

tbd

+
+ + + + + +
+

Other inline text decoration

+ +

tbd

+
+
+ + + + + + + + + + +
+

Line & paragraph layout

+ + +
+

Line breaking & hyphenation

+

tbd

+ + + + + + + + + +
+

In-word line-breaking

+

tbd

+
+ + + + + + + +
+

Line-edge rules

+ +

As in almost all writing systems, certain punctuation characters should not appear at the end or the start of a line. The Unicode line-break properties help applications decide whether a character should appear at the start or end of a line.

+ +

Show line-breaking properties for characters in the Buhid orthography.

+ + +
+
+ + + + + + + + +
+

Text alignment & justification

+ + + +

tbd

+
+ + + + + + + +
+

Text spacing

+ + + +

tbd

+
+ + + + +
+

Baselines, line height, etc.

+ +

Buhid uses the so-called 'alphabetic' baseline, which is the same as for Latin and many other scripts.

+ +

Buhid letters vary slightly in height but are mostly around the same, with no ascenders or descenders. Vowel signs may appear above or below some letters, but these are on horizontal dashes.

+ +

To give an approximate idea, fig_baselines compares Latin and Buhid glyphs from the Noto Sans font. The basic height of Buhid letters is typically around the Latin x-height, however some taller letters and combining marks can reach just beyond the Latin ascenders (but not the descenders), creating a need for slightly larger line spacing.

+ + +
+
+Hhqxᝉᝇᝏᝒᝌᝒᝐᝒᝁ᜶ +
+
Font metrics for Latin text compared with Buhid glyphs in the Noto Sans Buhid font.
+
+
+ + + + + + + + + +
+

Counters, lists, etc.

+ +

tbd

+
+ + + + + + +
+

Styling initials

+

tbd

+ +
+
+ + + + + + + + + + +
+

Page & book layout

+ +

This section is for any features that are specific to Buhid and that relate to the following topics: +general page layout & progression; +grids & tables; +notes, footnotes, etc; +forms & user interaction; +page numbering, running headers, etc. +

+ + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+

References

+
+ + + + + + + + + + + +
+ + + + + + diff --git a/buhd/bku/fig_baselines_noto_sans.png b/buhd/bku/fig_baselines_noto_sans.png new file mode 100644 index 000000000..1f33f3082 Binary files /dev/null and b/buhd/bku/fig_baselines_noto_sans.png differ diff --git a/buhd/bku_vocab.html b/buhd/bku_vocab.html new file mode 100755 index 000000000..82f47ab31 --- /dev/null +++ b/buhd/bku_vocab.html @@ -0,0 +1,84 @@ + + + + +Vocab lister + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ + +
+ +
+ + + +
+Licence CC-By © r12a + +
+ + + + + diff --git a/buhd/block-globals.js b/buhd/block-globals.js new file mode 100644 index 000000000..64777ed72 --- /dev/null +++ b/buhd/block-globals.js @@ -0,0 +1,11 @@ + +window.version = 'v29' +window.scriptName = 'Buhid' +window.ghDirectory = 'buhd' +window.blockDirectory = 'buhd' +window.languageList = ['bku'] // lang tags for each orthography handled +window.detailsfileList = ['bku'] // first part of xx-details for each orthography +window.scriptISO = 'buhd' +window.webfonts = ["Noto Sans Buhid WF"] +window.defaultSize = '24px' + diff --git a/buhd/block.html b/buhd/block.html new file mode 100755 index 000000000..a21569eec --- /dev/null +++ b/buhd/block.html @@ -0,0 +1,237 @@ + + + + +Buhid character notes + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+ +

Buhid character notes

+ + + + + + + + + + + +
+

+ + + + + +

This page lists characters used in orthographies based on the Buhid script and provides information about them.

+ +

Character notes have companion pages that summarise how a script is used for a specific orthography. For the Buhid script, see Buhid.

+ + +

The examples used in this page are constructed from Latin transcriptions, following the rules of the script. It is possible that one or two items may be incorrect.

+ + +
+Referencing this document +

Richard Ishida, Buhid Character Notes, 17-Dec-2023, https://r12a.github.io/scripts/buhd/block

+
+ + +

+ +
+ + + + + + + +
+

Buhid block

+ + + +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ + +
+ + + + + + + + +
+

Hanunoo block

+ +
+ +
+
+ + + + + + + + + + + +
+

References

+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + diff --git a/buhd/refs.js b/buhd/refs.js new file mode 100644 index 000000000..75873ec7c --- /dev/null +++ b/buhd/refs.js @@ -0,0 +1,130 @@ +window.langSet = false + + + +reflist = { + +/* +"auth_initials": { +"authors": "Sort_by_family_name_of_first_contributor", +"title":"The_Worlds_Writing_Systems", +"sub": "subtitle", +"date": "1996", +"retr": "May 2021", +"publisher":"Oxford_University_Press", +"isbn":"0-19-507993-0", +"pages": "xxx", +"url":"refs", +"lang": new Set(['ru']), +"reviewed":false +}, +*/ + +"mb": { +"authors": "R Marie Barham", +"title":"The Phonemes of the Buhid (Mangyan) Language of Eastern Mindoro, Philippines", +"date": "1955", +"retr": "Dec 2023", +"publisher":"Rosetta Project", +"url":"https://archive.org/details/rosettaproject_bku_phon-1/mode/2up", +"reviewed":false +}, + +"ts": { +"authors": "Takayuki K. Sato", +"title":"Philippino characters (status report)", +"date": "2000", +"retr": "May 2021", +"publisher":"ISO/IEC JTC/1 SC/2 WG/2 N2194", +"url":"https://www.unicode.org/L2/L2000/00097-n2194.pdf", +"reviewed":false +}, + +"me": { +"authors": "Michael Everson", +"title":"9.16 Philippine Scripts", +"sub": "New draft for Philippine script with block introduction", +"date": "2000", +"url":"https://www.unicode.org/L2/L2000/00357-philippine.pdf", +"reviewed":false +}, + +"u": { +"authors": "Unicode Consortium", +"title":"The Unicode Standard, Version 15.0", +"sub":"Chapter 17.1: Philippine Scripts", +"pages":"710-712", +"isbn":"978-1-936213-16-0.", +"url":"https://www.unicode.org/versions/Unicode15.0.0/ch17.pdf", +"reviewed": false +}, + +"elc": { +"authors": "Emerenciana Lorenzo Catapang", +"title":"Reviving the Hanunuo and Buhid Mangyan Scripts of the Philippines", +"url":"https://lingdy.aa-ken.jp/wp-content/uploads/2014/02/140227-intl-symp-and-ws_emerenciana_lorenzo_catapang_paper.pdf", +"reviewed":false +}, + +"wl": { +"authors": "Wikipedia", +"title":"Buhid language", +"retr": "Dec 2023", 
+"url":"https://en.wikipedia.org/wiki/Buhid_language", +"reviewed":false +}, + +"ws": { +"authors": "Wikipedia", +"title":"Buhid script", +"retr": "Dec 2023", +"url":"https://en.wikipedia.org/wiki/Buhid_script", +"reviewed":false +}, + +"e": { +"authors": "Eberhard, David M., Gary F. Simons, and Charles D. Fennig (eds.)", +"title":"Ethnologue: Languages of the World. Twenty-sixth edition", +"date": "2023", +"retr": "Dec 2023", +"publisher":"SIL International", +"url":"https://www.ethnologue.com/language/bku/", +"reviewed":true +}, + +} + + + + +scriptLanguageList = { +aio:{name:"Buhid"}, +} + + + + + + +terms = { + +"i": { +"url":"https://tal.ircam.ma/tamawalt/alphabet_p.php", +"authors": "ERCIM", +"title":"ⵜⴰⵎⴰⵡⴰⵍⵜ ⵏ ⵉⵎⵥⵥⵢⴰⵏⵏ", +}, + +"a": { +"url":"https://amawal.net/about", +"authors": "?", +"title":"ⴰⵎⴰⵡⴰⵍ The Berber dictionary", +"notes":"Latin only", +}, + + +} + + + + +