mirror of
https://github.com/cc65/cc65.git
synced 2024-11-05 08:05:51 +00:00
192 lines
3.9 KiB
C
192 lines
3.9 KiB
C
/*
|
|
!!DESCRIPTION!! print character frequencies
|
|
!!ORIGIN!! LCC 4.1 Testsuite
|
|
!!LICENCE!! own, freely distributeable for non-profit. read CPYRIGHT.LCC
|
|
*/
|
|
|
|
/*
|
|
cf - print character frequencies
|
|
*/
|
|
|
|
#include "common.h"
|
|
|
|
#include <stdlib.h>
|
|
#include <stdio.h>
|
|
#include <ctype.h>
|
|
|
|
FILE *in;
|
|
|
|
#define INFILE "cf.in"
|
|
#define GETCHAR() fgetc(in)
|
|
|
|
#ifndef NO_FLOATS
|
|
float f[0x100];
|
|
#else
|
|
signed f[0x100];
|
|
#endif
|
|
|
|
#ifdef NO_OLD_FUNC_DECL
|
|
int main(int argc,char **argv)
|
|
#else
|
|
main(argc, argv)
|
|
int argc;
|
|
char *argv[];
|
|
#endif
|
|
{
|
|
int i, c, nc;
|
|
#ifndef NO_FLOATS
|
|
float cutoff, atof();
|
|
#else
|
|
signed cutoff;
|
|
#endif
|
|
|
|
in = fopen(INFILE, "rb");
|
|
if (in == NULL) {
|
|
return EXIT_FAILURE;
|
|
}
|
|
|
|
if (argc <= 1)
|
|
#ifndef NO_FLOATS
|
|
cutoff = 0.0;
|
|
#else
|
|
cutoff = 0;
|
|
#endif
|
|
else
|
|
#ifndef NO_FLOATS
|
|
cutoff = atof(argv[1])/100;
|
|
#else
|
|
cutoff = atoi(argv[1])/100;
|
|
#endif
|
|
for (i = 0; i < 0x100; )
|
|
{
|
|
#ifndef NO_FLOATS
|
|
f[i++] = 0.0;
|
|
#else
|
|
f[i++] = 0;
|
|
#endif
|
|
}
|
|
|
|
printf("input:\n\n");
|
|
|
|
nc = 0;
|
|
while ((c = GETCHAR()) != -1)
|
|
{
|
|
/* printf("[%02x]",c); */
|
|
printf("%c",c);
|
|
f[c] += 1;
|
|
nc++;
|
|
}
|
|
printf("\n\ncount: %d\n\n",nc);
|
|
|
|
/*
|
|
now try to print a report in a way so that
|
|
the order is somewhat independent from the
|
|
target character set
|
|
*/
|
|
|
|
printf("a-z char:freq\n\n");
|
|
|
|
/* first round ... lowercase characters */
|
|
for (i = 0; i < 0x100; ++i)
|
|
{
|
|
if ((f[i]) && ((f[i]/nc) >= cutoff))
|
|
{
|
|
if ((i >= 'a') && (i <= 'z'))
|
|
{
|
|
printf("%c", i);
|
|
#ifndef NO_FLOATS
|
|
printf(":%.1f\n", 100*f[i]/nc);
|
|
#else
|
|
printf(":%d\n", 100*f[i]/nc);
|
|
#endif
|
|
f[i]=0;
|
|
}
|
|
}
|
|
}
|
|
|
|
printf("A-Z char:freq\n\n");
|
|
|
|
/* second round ... uppercase characters */
|
|
for (i = 0; i < 0x100; ++i)
|
|
{
|
|
if ((f[i]) && ((f[i]/nc) >= cutoff))
|
|
{
|
|
if ((i >= 'A') && (i <= 'Z'))
|
|
{
|
|
printf("%c", i);
|
|
#ifndef NO_FLOATS
|
|
printf(":%.1f\n", 100*f[i]/nc);
|
|
#else
|
|
printf(":%d\n", 100*f[i]/nc);
|
|
#endif
|
|
f[i]=0;
|
|
}
|
|
}
|
|
}
|
|
|
|
printf("0-9 char:freq\n\n");
|
|
|
|
/* third round ... numbers */
|
|
for (i = 0; i < 0x100; ++i)
|
|
{
|
|
if ((f[i]) && ((f[i]/nc) >= cutoff))
|
|
{
|
|
if ((i >= '0') && (i <= '9'))
|
|
{
|
|
printf("%c", i);
|
|
#ifndef NO_FLOATS
|
|
printf(":%.1f\n", 100*f[i]/nc);
|
|
#else
|
|
printf(":%d\n", 100*f[i]/nc);
|
|
#endif
|
|
f[i]=0;
|
|
}
|
|
}
|
|
}
|
|
|
|
printf("isprint char:freq\n\n");
|
|
|
|
/* second last round ... remaining printable characters */
|
|
for (i = 0; i < 0x100; ++i)
|
|
{
|
|
if ((f[i]) && ((f[i]/nc) >= cutoff))
|
|
{
|
|
if(isprint(i))
|
|
{
|
|
printf("%c", i);
|
|
#ifndef NO_FLOATS
|
|
printf(":%.1f\n", 100*f[i]/nc);
|
|
#else
|
|
printf(":%d\n", 100*f[i]/nc);
|
|
#endif
|
|
f[i]=0;
|
|
}
|
|
}
|
|
}
|
|
|
|
printf("rest char:freq\n\n");
|
|
|
|
/* last round ... remaining non printable characters */
|
|
for (i = 0; i < 0x100; ++i)
|
|
{
|
|
if ((f[i]) && ((f[i]/nc) >= cutoff))
|
|
{
|
|
if(i=='\n')
|
|
{
|
|
printf("newline");
|
|
}
|
|
else
|
|
{
|
|
printf("%03o", i);
|
|
}
|
|
#ifndef NO_FLOATS
|
|
printf(":%.1f\n", 100*f[i]/nc);
|
|
#else
|
|
printf(":%d\n", 100*f[i]/nc);
|
|
#endif
|
|
}
|
|
}
|
|
fclose(in);
|
|
return 0;
|
|
}
|