view test-data/sample_text_frequency.dat @ 0:e991d4e60c17 draft

planemo upload commit 0203cb3a0b40d9348674b2b098af805e2986abca-dirty
author stevecassidy
date Wed, 12 Oct 2016 22:17:53 -0400
parents
children
line wrap: on
line source

Word	Count	Percent
the	44	6.32
of	26	3.74
and	25	3.59
.	24	3.45
to	23	3.30
a	15	2.16
,	12	1.72
for	12	1.72
will	12	1.72
is	11	1.58
DADA	9	1.29
some	8	1.15
(	7	1.01
be	7	1.01
on	7	1.01
that	7	1.01
this	7	1.01
Australian	7	1.01
)	7	1.01
The	7	1.01
text	6	0.86
project	6	0.86
we	6	0.86
infrastructure	6	0.86
from	6	0.86
have	6	0.86
in	6	0.86
video	5	0.72
language	5	0.72
data	5	0.72
it	5	0.72
collection	5	0.72
annotation	5	0.72
Corpus	4	0.57
with	4	0.57
build	4	0.57
audio	4	0.57
hope	3	0.43
collections	3	0.43
resources	3	0.43
funding	3	0.43
available	3	0.43
English	3	0.43
meta-data	3	0.43
Macquarie	3	0.43
done	3	0.43
two	3	0.43
corpus	3	0.43
part	3	0.43
work	3	0.43
up	3	0.43
at	3	0.43
-	3	0.43
code	2	0.29
people	2	0.29
We	2	0.29
but	2	0.29
has	2	0.29
them	2	0.29
example	2	0.29
words	2	0.29
using	2	0.29
now	2	0.29
collect	2	0.29
each	2	0.29
corpora	2	0.29
year	2	0.29
server	2	0.29
new	2	0.29
public	2	0.29
by	2	0.29
search	2	0.29
store	2	0.29
involves	2	0.29
within	2	0.29
texts	2	0.29
support	2	0.29
Language	2	0.29
sentences	2	0.29
freely	2	0.29
National	2	0.29
funded	2	0.29
site	2	0.29
an	2	0.29
as	2	0.29
able	2	0.29
make	2	0.29
subjects	2	0.29
speech	2	0.29
development	2	0.29
recording	2	0.29
I	2	0.29
significant	2	0.29
task	2	0.29
provide	2	0.29
ARC	2	0.29
demo	1	0.14
automatically	1	0.14
What	1	0.14
Service	1	0.14
being	1	0.14
both	1	0.14
soon	1	0.14
existing	1	0.14
large	1	0.14
via	1	0.14
looks	1	0.14
Haugh	1	0.14
still	1	0.14
find	1	0.14
alignment	1	0.14
web	1	0.14
Recently	1	0.14
writing	1	0.14
linguistics	1	0.14
only	1	0.14
going	1	0.14
systems	1	0.14
under	1	0.14
Using	1	0.14
2011	1	0.14
take	1	0.14
move	1	0.14
around	1	0.14
get	1	0.14
read	1	0.14
providing	1	0.14
Michael	1	0.14
number	1	0.14
Project	1	0.14
next	1	0.14
While	1	0.14
Oz	1	0.14
communities	1	0.14
comes	1	0.14
projects	1	0.14
articles	1	0.14
like	1	0.14
visible	1	0.14
manual	1	0.14
solution	1	0.14
've	1	0.14
capability	1	0.14
these	1	0.14
continue	1	0.14
steps	1	0.14
common	1	0.14
small	1	0.14
Speech	1	0.14
fixed	1	0.14
Griffith	1	0.14
searching	1	0.14
core	1	0.14
doing	1	0.14
Since	1	0.14
idea	1	0.14
All	1	0.14
titles	1	0.14
are	1	0.14
picked	1	0.14
Some	1	0.14
network	1	0.14
renamed	1	0.14
managing	1	0.14
sites	1	0.14
publish	1	0.14
research	1	0.14
Later	1	0.14
AusNC	1	0.14
written	1	0.14
between	1	0.14
technology	1	0.14
reading	1	0.14
can	1	0.14
recently	1	0.14
repository	1	0.14
partners	1	0.14
This	1	0.14
University	1	0.14
hosted	1	0.14
free	1	0.14
box	1	0.14
exposing	1	0.14
technical	1	0.14
study	1	0.14
allows	1	0.14
forced	1	0.14
Sign	1	0.14
published	1	0.14
map	1	0.14
MQ	1	0.14
month	1	0.14
interviews	1	0.14
software	1	0.14
already	1	0.14
useful	1	0.14
secure	1	0.14
'black	1	0.14
primary	1	0.14
whatever	1	0.14
Update	1	0.14
1000	1	0.14
parties	1	0.14
loaded	1	0.14
centralised	1	0.14
Auslan	1	0.14
1900	1	0.14
size	1	0.14
little	1	0.14
Australia	1	0.14
initial	1	0.14
been	1	0.14
Early	1	0.14
their	1	0.14
station	1	0.14
down	1	0.14
basic	1	0.14
collected	1	0.14
:	1	0.14
Data	1	0.14
ANDS	1	0.14
more	1	0.14
describe	1	0.14
HCSNet	1	0.14
denoting	1	0.14
interviewed	1	0.14
Trevor	1	0.14
bitbucket	1	0.14
testing	1	0.14
Johnston	1	0.14
effort	1	0.14
pilot	1	0.14
upgrades	1	0.14
main	1	0.14
look	1	0.14
developing	1	0.14
reliable	1	0.14
pace	1	0.14
while	1	0.14
technoogy	1	0.14
install	1	0.14
Our	1	0.14
transcripts	1	0.14
country	1	0.14
descriptions	1	0.14
due	1	0.14
documentation	1	0.14
allowed	1	0.14
sample	1	0.14
enable	1	0.14
create	1	0.14
demonstration	1	0.14
Map	1	0.14
speakers	1	0.14
inside	1	0.14
end	1	0.14
sessions	1	0.14
things	1	0.14
permission	1	0.14
feature	1	0.14
who	1	0.14
started	1	0.14
which	1	0.14
digital	1	0.14
many	1	0.14
outside	1	0.14
used	1	0.14
's	1	0.14
separate	1	0.14
collaboration	1	0.14
after	1	0.14
driver	1	0.14
needs	1	0.14
moment	1	0.14
important	1	0.14
designed	1	0.14
tidying	1	0.14
services	1	0.14
elicit	1	0.14
AusTalk	1	0.14
expand	1	0.14
stereo	1	0.14
natural	1	0.14
'	1	0.14
third	1	0.14
later	1	0.14
game	1	0.14
An	1	0.14
As	1	0.14
so	1	0.14
Big	1	0.14
allow	1	0.14
sets	1	0.14