[Top][All Lists]
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
[GNUnet-SVN] r648 - Extractor-docs/WWW GNUnet-docs/WWW i18nHTML-docs/WWW
From: grothoff
Subject: [GNUnet-SVN] r648 - Extractor-docs/WWW GNUnet-docs/WWW i18nHTML-docs/WWW i18nHTML-docs/WWW/download
Date: Sun, 10 Apr 2005 23:58:58 -0700 (PDT)
Author: grothoff
Date: 2005-04-10 23:58:51 -0700 (Sun, 10 Apr 2005)
New Revision: 648
Added:
i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
Modified:
Extractor-docs/WWW/index.php
GNUnet-docs/WWW/index.php
i18nHTML-docs/WWW/index.php
Log:
revert
Modified: Extractor-docs/WWW/index.php
===================================================================
--- Extractor-docs/WWW/index.php 2005-04-11 06:52:55 UTC (rev 647)
+++ Extractor-docs/WWW/index.php 2005-04-11 06:58:51 UTC (rev 648)
@@ -1,199 +1,108 @@
<?php
-include("i18nhtml.inc");
-DOCTYPE("HTML", "Transitional");
-echo "<html><head>\n";
-if ($title) {
- echo "<title>";
- TRANSLATE("Doodle: find information on your computer");
- echo "</title>";
- }
-if ($description) {
- echo "<meta name=\"description\" content=\"";
- TRANSLATE("A tool to index and search the files on your disk.");
- echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" .
- $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" .
- $languagecodes[$lang] . "\">";
-?>
-<meta name="author" content="Christian Grothoff">
-<meta name="keywords"
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
-<meta name="robots" content="index,follow">
-<meta name="revisit-after" content="28 days">
-<meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
-<meta http-equiv="expires" content="43200">
-<meta http-equiv="content-type" content="text/html">
-</head>
-<body>
-<?php
-generateLanguageBar();
+$title="libextractor - a simple library for keyword extraction";
+$description="a simple library for keyword extraction";
+$email="address@hidden";
+$keywords="keyword, extraction, mp3, html, pdf, images, jpeg, gif, ps, mime,
real, qt, asf, mpeg, avi, riff, tiff, summary, summaries, kbps, format,
mime-type, zip, elf, doc, ppt, xls, sha-1, md5, open office, sxw, dvi, id3,
id3v2, id3v2.3, id3v2.4, thumbnails";
+$author="Vids Samanta and Christian Grothoff";
+$page="home";
+include("html_header.php3");
-H1("Doodle");
ANCHOR("about");
-H2("About");
+H2("About libextractor");
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
- extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
- extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
- extlink_("#links", "links"));
-
+IMG("extractor_logo.png", "libextractor", "right", "136", "94", "0");
P();
-W("Doodle is licensed under the %s.",
- extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
- ARRAY(extlink_("http://www.debian.org/", "Debian"),
- extlink_("http://www.redhat.com/", "RedHat"),
- extlink_("http://www.gnu.org/", "GNU"),
- extlink_("http://www.linux.org/", "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
- extlink_("/libextractor/", "libextractor"));
-P();
+W("libextractor is a library used to extract meta-data from files of arbitrary
type.");
+W("It is designed to use helper-libraries to perform the actual extraction,
and to be trivially extendable by linking against external extractors for
additional file types.");
+W("libextractor is part of the %s.",
+ extlink_("http://www.gnu.org/", "GNU project"));
+//W("Our official GNU website can be found at %s.",
+//
extlink_("http://www.gnu.org/software/libextractor/","http://www.gnu.org/software/libextractor/"));
+W("libextractor can be downloaded from this site or the %s.",
+ extlink_("http://www.gnu.org/prep/ftp.html","GNU mirrors"));
-ANCHOR("download");
-H2("Download");
-W("You can find the current release %s.",
- extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
- ARRAY(extlink_("man/doodle.html", "doodle"),
- extlink_("man/doodled.html", "doodled"),
- extlink_("man/libdoodle", "libdoodle")));
-
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/");
-P();
-W("If you want to be notified about updates, subscribe to %s",
- extlink_("http://freshmeat.net/projects/doodle/", "doodle on freshmeat"));
P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
- extlink_("http://packages.debian.org/doodle", "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
- extlink_("http://dag.wieers.com/packages/doodle/","here"));
+W("The goal is to provide developers of file-sharing networks or WWW-indexing
bots with a universal library to obtain simple keywords to match against
queries.");
+W("libextractor contains a shell-command &quot;extract&quot; that, similar to
the well-known &quot;file&quot; command, can extract meta-data from a file an
print the results to stdout.");
P();
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
+W("Currently, libextractor supports the following formats:");
+include("plugins_list");
BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled,
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates
the doodle database.",
- "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments
that you would pass to doodle to construct the database, but without the
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b
/</tt>), it is typically not a great idea to have doodled monitor your entire
system for changes -- especially since <tt>/usr</tt> is unlikely to change
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
- "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory
will be always up-to-date.");
+W("Also, various additional MIME types are detected.");
P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
- extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!)
result in doodle re-indexing files that were processed with other options
previously.");
-W("The only way to force doodle to re-index files with different options is to
either touch the files (change modification timestamp) or to delete the old
database and start from scratch.");
+W("libextractor is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the Free
Software Foundation; either version 2 of the License, or (at your option) any
later version.");
+ANCHOR("news");
+H2("Recent News");
P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the
entire system periodically (cron job) and have doodled monitor the home
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll
the database.");
-W("Doodle will ensure that information about files not accessible to the user
are not leaked by checking if files found in the database are accessible to the
user.");
-W("doodled has to run as root since otherwise it would be impossible to index
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files
readable to the user that runs doodled.");
-
-
+echo "<dl>";
+DTDD("Thu Feb 24 01:23:31 EST 2005 | libextractor v0.4.2 released.",
+ "This release fixes some bugs in the ID3, PDF, PNG and REAL extractors.
The REAL extractor now also handles the new Helix formats. libextractor can
now also be used to extract thumbnails from images (using ImageMagick).");
+DTDD("Wed Jan 26 19:51:44 EST 2005 | libextractor v0.4.1 released.",
+ "This release fixes a security issue (inherited from xpdf). It also
extracts more meta-data from files of TAR or QuickTime format.");
+DTDD("Sat Dec 25 21:42:26 CET 2004 | libextractor v0.4.0 released.",
+ "This release improves support for character sets (plugins are now
expected to convert to UTF-8). It also improves support for mp3 (adding
genres) and png (handling of compressed comments).");
+DTDD("Sat Nov 13 13:23:23 EST 2004 | libextractor v0.3.11 released.",
+ "This release fixes bugs in the dvi, man, ID3v2.3, ole2 and pdf
extractors.");
+DTDD("Sun Oct 18 13:23:35 EST 2004 | libextractor v0.3.10 released.",
+ "This release adds support for ID3v2.3 and ID3v2.4. It fixes bugs in the
tar, man, deb, mp3 and ole2 extractors.");
+DTDD("Sat Oct 17 18:12:11 EST 2004 | libextractor v0.3.9 released.",
+ "This release adds support for the man, tar (including tar.gz) and deb
formats. It fixes bugs in the id3v2 and jpeg extractors. The size of jpeg
images is now also extracted. This version adds support for 64-bit file
sizes.");
+DTDD("Sat Oct 02 20:00:04 EST 2004 | libextractor v0.3.8 released.",
+ "This release adds support for dvi (from TeX). The plugins are now installed
in a separate plugin directory. libextractor now works under OS X (10.3).");
+DTDD("Fri Sep 23 23:30:33 EST 2004 | libextractor v0.3.7 released.",
+ "This release adds support for StarOffice formats, ID3v2 tags and the
Ripe160MD hash function. It also improves the performance of the HTML and ZIP
extractors.");
+DTDD("Fri Sep 10 20:10:38 EST 2004 | libextractor v0.3.6 released.",
+ "This release adds support for OpenOffice formats, hash functions (md5,
sha-1) and fixes some build problems.");
+DTDD("Mon Aug 30 23:18:49 IST 2004 | libextractor v0.3.5 released.",
+ "This release adds support for OLE2 (WinWord, PowerPoint, Excel formats)
and fixes various minor bugs. For OLE2 support you will have to have glib 2.0
installed (yes, that is glib from GTK/Gnome, not glibc!).");
+DTDD("Thu Aug 26 20:27:24 IST 2004 | Bugtracking using Mantis enabled.",
+ "You can now report and view bug-reports about libextractor on %s.",
+ extlink_("https://gnunet.org/mantis/","Mantis"));
+DTDD("Wed Aug 25 19:02:07 IST 2004 | libextractor v0.3.4 released.",
+ "This release fixes a minor linking error (<tt>-lm</tt> for
<tt>floor</tt>), improves performance and adds support for GNU gettext
(internationalization).");
+DTDD("Wed May 31 19:22:07 EST 2004 | libextractor v0.3.3 released.",
+ "This release fixes various minor bugs (segmentation faults and
non-termination of mpeg and riff extractors for malformed files) and adds
support for WAV files.");
+DTDD("Wed May 31 19:22:07 EST 2004 | libextractor v0.3.2 released.",
+ "This release fixes various minor bugs (plugins misbehaving for malformed
files) and improves portability to Cygwin/MinGW.");
+echo "</dl>";
P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
- "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n"
.
- "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in
one run (see %s for option <tt>-d</tt>).",
- extlink_("man/doodle.html", "doodle"));
+W("%s",
+ intlink_("oldnews","Older news archive"));
-P();
-ANCHOR("mantis");
-H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
-W("Visit %s to report bugs.",
- extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/";));
-W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not
under any of the other projects.");
-P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
- extlink_("mailto:address@hidden","address@hidden";));
-
-
ANCHOR("links");
H2("Links");
+P();
+W("Related work:");
echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/";,
- "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/";,
- "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/";,
- "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/";,
- "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/";,
- "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/";,
- "HTDig");
-LILI("http://jakarta.apache.org/lucene/";,
- "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/";,
- "Swish++");
-LILI("http://webglimpse.net/";,
- "Glimpse");
-LILI("http://evidence.sf.net/";,
- "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html";,
- "Article about doodle (and other things) in the German Linux-Magazin");
+LILI("http://www.wotsit.org","File format database");
+LILI("http://getid3.sf.net/","getid3, similar project for PHP");
+LILI("download/php/",
+ "PHP wrapper for libextractor (mirrored, not written by us, see README)");
+LILI("http://dublincore.org/documents/dcmi-terms/","Meta-data categorization
standard");
+LILI("http://hul.harvard.edu/jhove/","JHOVE, Harvard Object Validation
Environment");
echo "</ul>";
-HR();
-echo "<address><a href=\"mailto:address@hidden";>Christian
Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
- "Verbatim copying and distribution of this entire article\n" .
- "is permitted in any medium, provided this notice is preserved.");
-BR();
-generateFooter();
-echo "</body></html>\n";
+W("Projects that use libextractor:");
+echo "<ul>";
+LILI("http://witme.sourceforge.net/libferris.web/","libferris, a virtual file
system");
+LILI("http://evidence.sf.net/","Evidence, enlightened file manager");
+LILI("http://gnunet.org/","GNUnet, secure P2P file sharing");
+LILI("http://gnunet.org/doodle/","doodle, index your disk");
+echo "</ul>";
+
+ANCHOR("contact");
+H2("Contact");
+P();
+W("libextractor is developed by %s and %s.",
+ ARRAY(extlink_("http://grothoff.org/christian/",
+ "Christian Grothoff"),
+ extlink_("http://compilers.cs.purdue.edu/~vids/",
+ "Vids Samanta")));
+W("For questions about libextractor send email to %s.",
+ extlink_("mailto:address@hidden",
+ "address@hidden"));
+
+include("html_footer.php3");
?>
+
Modified: GNUnet-docs/WWW/index.php
===================================================================
--- GNUnet-docs/WWW/index.php 2005-04-11 06:52:55 UTC (rev 647)
+++ GNUnet-docs/WWW/index.php 2005-04-11 06:58:51 UTC (rev 648)
@@ -1,199 +1,83 @@
<?php
-include("i18nhtml.inc");
-DOCTYPE("HTML", "Transitional");
-echo "<html><head>\n";
-if ($title) {
- echo "<title>";
- TRANSLATE("Doodle: find information on your computer");
- echo "</title>";
- }
-if ($description) {
- echo "<meta name=\"description\" content=\"";
- TRANSLATE("A tool to index and search the files on your disk.");
- echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" .
- $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" .
- $languagecodes[$lang] . "\">";
-?>
-<meta name="author" content="Christian Grothoff">
-<meta name="keywords"
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
-<meta name="robots" content="index,follow">
-<meta name="revisit-after" content="28 days">
-<meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
-<meta http-equiv="expires" content="43200">
-<meta http-equiv="content-type" content="text/html">
-</head>
-<body>
-<?php
-generateLanguageBar();
+include("scripts.php3");
+$title = "GNUnet";
+$description="GNUnet - an anonymous distributed backup system :-)";
+include("html_header.php3");
-H1("Doodle");
-ANCHOR("about");
-H2("About");
+H2("About GNUnet");
+gnunetlogo();
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
- extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
- extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
- extlink_("#links", "links"));
-
+W("GNUnet is a framework for secure peer-to-peer networking that does not use
any centralized or otherwise trusted services.");
+W("A first service implemented on top of the networking layer allows anonymous
censorship-resistant file-sharing.");
+W("GNUnet uses a simple, excess-based economic model to allocate resources.");
+W("Peers in GNUnet monitor each others behavior with respect to resource
usage; peers that contribute to the network are rewarded with better service.");
P();
-W("Doodle is licensed under the %s.",
- extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
- ARRAY(extlink_("http://www.debian.org/";, "Debian"),
- extlink_("http://www.redhat.com/";, "RedHat"),
- extlink_("http://www.gnu.org/";, "GNU"),
- extlink_("http://www.linux.org/";, "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
- extlink_("/libextractor/", "libextractor"));
-P();
-ANCHOR("download");
-H2("Download");
-W("You can find the current release %s.",
- extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
- ARRAY(extlink_("man/doodle.html", "doodle"),
- extlink_("man/doodled.html", "doodled"),
- extlink_("man/libdoodle", "libdoodle")));
+W("GNUnet is part of the %s.",
+ extlink_("http://www.gnu.org/","GNU project"));
+W("Our official GNU website can be found at %s.",
+
extlink_("http://www.gnu.org/software/gnunet/","http://www.gnu.org/software/gnunet/"));
+W("GNUnet can be downloaded from this site or the %s.",
+ extlink_("http://www.gnu.org/prep/ftp.html","GNU mirrors"));
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/";);
-P();
-W("If you want to be notified about updates, subscribe to %s",
- extlink_("http://freshmeat.net/projects/doodle/";, "doodle on freshmeat"));
P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
- extlink_("http://packages.debian.org/doodle";, "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
- extlink_("http://dag.wieers.com/packages/doodle/","here";));
-P();
+H2("News");
+W("Older news can be found %s.\n",
+ intlink_("old_news.php3", "here"));
+echo "<dl>\n";
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
-BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled,
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates
the doodle database.",
- "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments
that you would pass to doodle to construct the database, but without the
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b
/</tt>), it is typically not a great idea to have doodled monitor your entire
system for changes -- especially since <tt>/usr</tt> is unlikely to change
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
- "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory
will be always up-to-date.");
-P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
- extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!)
result in doodle re-indexing files that were processed with other options
previously.");
-W("The only way to force doodle to re-index files with different options is to
either touch the files (change modification timestamp) or to delete the old
database and start from scratch.");
+function convert_time($mysql_timestamp){
+if (ereg("^([0-9]{4})([0-9]{2})([0-9]{2})([0-9]{2})" .
+ "([0-9]{2})([0-9]{2})",$mysql_timestamp,$res)):
+ $year=$res[1];
+ $month=$res[2];
+ $day=$res[3];
+ $hour=$res[4];
+ $min=$res[5];
+ $sec=$res[6];
-P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the
entire system periodically (cron job) and have doodled monitor the home
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll
the database.");
-W("Doodle will ensure that information about files not accessible to the user
are not leaked by checking if files found in the database are accessible to the
user.");
-W("doodled has to run as root since otherwise it would be impossible to index
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files
readable to the user that runs doodled.");
+ return(array($year,$month,$day,$hour,$min,$sec));
+ else:
+ return(false);
+ endif;
+}
-
+// definition: news is what is less than 3 months old :-)
+$query = "SELECT title,include,posted FROM news " .
+ "WHERE TO_DAYS(NOW())-TO_DAYS(posted) < 90 " .
+ "ORDER BY posted DESC";
+$result = mysql_query($query, $connection);
+$num = 0;
+if ($result) {
+ $num = mysql_numrows($result);
+}
+for ($i=0;$i<$num;$i++) {
+ $row = mysql_fetch_array($result);
+ $pd = convert_time($row["posted"]);
+ echo "<dt>" . $pd[0] . "-" . $pd[1] . "-" . $pd[2] . ": " .
W_($row["title"]) . "</dt>\n";
+ echo "<dd>\n";
+ include($row["include"]);
+ echo "</dd>\n";
+}
+echo "</dl>\n";
P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
- "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n"
.
- "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in
one run (see %s for option <tt>-d</tt>).",
- extlink_("man/doodle.html", "doodle"));
-
+H2("Roadmap");
+W("Here is the current development plan:");
+echo "<ul>\n";
+LI("fix %s",
+ extlink_("https://gnunet.org/mantis/","bugs"));
+LI("improve handling of pseudonyms (manage reputation in namespaces)");
+LI("add testbed harness to allow automated testing and profiling (%s)",
+ extlink_("mailto:address@hidden","contact"));
+LI("extend GTK UI (delete, statistics, configuration, recursive insertion)");
+LI("add download-daemon that manages ongoing/completed/stalled downloads");
+echo "</ul>\n";
P();
-ANCHOR("mantis");
-H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
-W("Visit %s to report bugs.",
- extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/";));
-W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not
under any of the other projects.");
-P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
- extlink_("mailto:address@hidden","address@hidden";));
+H2("Contact");
+W("GNUnet is developed by %s.",
+ extlink_("http://www.gnu.org/software/gnunet/","the GNUnet developers"));
+W("For questions about GNUnet send E-Mail to %s.",
+ extlink_("mailto:address@hidden","address@hidden"));
-
-ANCHOR("links");
-H2("Links");
-echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/";,
- "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/";,
- "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/";,
- "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/";,
- "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/";,
- "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/";,
- "HTDig");
-LILI("http://jakarta.apache.org/lucene/";,
- "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/";,
- "Swish++");
-LILI("http://webglimpse.net/";,
- "Glimpse");
-LILI("http://evidence.sf.net/";,
- "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html";,
- "Article about doodle (and other things) in the German Linux-Magazin");
-echo "</ul>";
-HR();
-echo "<address><a href=\"mailto:address@hidden";>Christian
Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
- "Verbatim copying and distribution of this entire article\n" .
- "is permitted in any medium, provided this notice is preserved.");
-BR();
-generateFooter();
-echo "</body></html>\n";
+include("html_footer.php3");
?>
Added: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
===================================================================
(Binary files differ)
Property changes on: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
___________________________________________________________________
Name: svn:mime-type
+ application/octet-stream
Added: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
===================================================================
(Binary files differ)
Property changes on: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
___________________________________________________________________
Name: svn:mime-type
+ application/octet-stream
Modified: i18nHTML-docs/WWW/index.php
===================================================================
--- i18nHTML-docs/WWW/index.php 2005-04-11 06:52:55 UTC (rev 647)
+++ i18nHTML-docs/WWW/index.php 2005-04-11 06:58:51 UTC (rev 648)
@@ -2,198 +2,84 @@
include("i18nhtml.inc");
DOCTYPE("HTML", "Transitional");
echo "<html><head>\n";
-if ($title) {
- echo "<title>";
- TRANSLATE("Doodle: find information on your computer");
- echo "</title>";
- }
-if ($description) {
- echo "<meta name=\"description\" content=\"";
- TRANSLATE("A tool to index and search the files on your disk.");
- echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" .
- $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" .
- $languagecodes[$lang] . "\">";
+TITLE("i18nHTML - enabling collaborative webpage translation");
+echo "<meta name=\"description\" content=\"";
+TRANSLATE("i18nHTML is a collection of PHP scripts that allow visitors of a
webpage to help translating it.");
+echo "\">";
?>
<meta name="author" content="Christian Grothoff">
-<meta name="keywords"
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
+<meta name="keywords"
content="i18n,HTML,PHP,translation,languages,mysql,database,internationalization,www,free,GNU,GPL">
<meta name="robots" content="index,follow">
<meta name="revisit-after" content="28 days">
<meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
+<meta name="date" content="2005-01-03">
+<meta name="rights" content="(C) 2004,2005 by Christian Grothoff>";
<meta http-equiv="expires" content="43200">
<meta http-equiv="content-type" content="text/html">
</head>
<body>
<?php
generateLanguageBar();
-
-H1("Doodle");
-ANCHOR("about");
+H1("i18nHTML");
H2("About");
-
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
- extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
- extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
- extlink_("#links", "links"));
-
+W("i18nHTML is a collection of PHP files that can be used to write webpages
that visitors can translate into their respective native languages.");
+W("i18nHTML uses a database to match sentences from the webpage against
translations.");
+W("i18nHTML defines a set of PHP functions that generate either the translated
HTML sentences or the original (typically English) text with decorations that
allow users to provide translations.");
+W("i18nHTML requires the internationalized webpages to be written using the
provided PHP functions but does not constrain the page design in any way.");
+W("Webpages internationalized with i18nHTML can be updated without loosing
existing translations for sentences that were not changed.");
+W("Note that it is important that you use the i18nHTML <tt>TITLE</tt> command
in your documents in order to ensure that the character set and other meta-data
is set properly.");
P();
-W("Doodle is licensed under the %s.",
- extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
- ARRAY(extlink_("http://www.debian.org/", "Debian"),
- extlink_("http://www.redhat.com/", "RedHat"),
- extlink_("http://www.gnu.org/", "GNU"),
- extlink_("http://www.linux.org/", "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
- extlink_("/libextractor/", "libextractor"));
+H2("News");
+H3("i18nHTML 0.1.0 released");
+W("i18nHTML 0.1.0 is expected to solve various character set encoding
issues.");
+W("It also ensures that all entered translations match the original sentence
in the number of escape sequences.");
+W("The new version also resolves various minor bugs (such as editor mode only
working with php-register-globals enabled).");
P();
-
-ANCHOR("download");
+W("Upgrading from i18nHTML 0.0.2 to 0.1.0 requires changes to the encoding of
strings in the database (which is now hopefully properly based on unicode).");
+W("This can be done by running the update.php script and feeding the SQL
statements that update.php generates into MySQL.");
+W("Running <tt>update.php</tt> by itself will not do the data conversion (for
security reasons).");
+W("You should backup your old translation database first.");
+W("mysqldump should be useful here.");
+W("Note that <tt>update.php</tt> may discard translations that it believes
have serious character set (or other) problems.");
+W("The total number of discarded translations can be found at the end of the
output (in a generated comment).");
+P();
+W("Another important step in upgrading from 0.0.2 to 0.1.0 is to use the new
<tt>TITLE</tt> function to generate the title of all webpages.");
+W("The reason is that the <tt>TITLE</tt> function will generate other HTML
tags that should be placed in the HTML header to help ensure that the browser
picks up the character encodings correctly.");
+P();
H2("Download");
-W("You can find the current release %s.",
- extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
- ARRAY(extlink_("man/doodle.html", "doodle"),
- extlink_("man/doodled.html", "doodled"),
- extlink_("man/libdoodle", "libdoodle")));
-
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/");
+W("You can find the latest version %s.",
+ extlink_("https://gnunet.org/i18nHTML/download/", "here"));
+W("The latest SVN version can be obtained using");
+PRE("$ svn checkout https://gnunet.org/svn/i18nHTML/");
P();
W("If you want to be notified about updates, subscribe to %s",
- extlink_("http://freshmeat.net/projects/doodle/", "doodle on freshmeat"));
+ extlink_("http://freshmeat.net/projects/i18nHTML/", "i18nHTML on freshmeat"));
P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
- extlink_("http://packages.debian.org/doodle", "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
- extlink_("http://dag.wieers.com/packages/doodle/","here"));
-P();
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
-BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled,
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates
the doodle database.",
- "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments
that you would pass to doodle to construct the database, but without the
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b
/</tt>), it is typically not a great idea to have doodled monitor your entire
system for changes -- especially since <tt>/usr</tt> is unlikely to change
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
- "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory
will be always up-to-date.");
-P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
- extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!)
result in doodle re-indexing files that were processed with other options
previously.");
-W("The only way to force doodle to re-index files with different options is to
either touch the files (change modification timestamp) or to delete the old
database and start from scratch.");
-P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the
entire system periodically (cron job) and have doodled monitor the home
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll
the database.");
-W("Doodle will ensure that information about files not accessible to the user
are not leaked by checking if files found in the database are accessible to the
user.");
-W("doodled has to run as root since otherwise it would be impossible to index
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files
readable to the user that runs doodled.");
-
P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
- "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n"
.
- "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in
one run (see %s for option <tt>-d</tt>).",
- extlink_("man/doodle.html", "doodle"));
+if ( ($xlang) && ($xlang != "English")) {
+ H2("Mass translation");
+ W("The mass-translation page for translating many sentences at once is %s.",
+ intlink_("editor.php", "here"));
+ W("Note that the sentence database is shared with the %s, %s and %s projects.",
+ ARRAY(extlink_("http://gnunet.org/", "GNUnet"),
+ extlink_("http://gnunet.org/doodle/", "doodle"),
+ extlink_("http://gnunet.org/libextractor/", "libExtractor")));
+ }
-P();
-ANCHOR("mantis");
H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
+W("i18nHTML uses Mantis for bugtracking.");
W("Visit %s to report bugs.",
 extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/"));
W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not
under any of the other projects.");
+W("Please make sure you report bugs under <strong>I18nHTML</strong> and not
under any of the other projects.");
P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
+W("If you dislike Mantis and need to report a bug contact %s via e-mail (good
luck getting by the spam-filter).",
 extlink_("mailto:address@hidden","address@hidden"));
-
-ANCHOR("links");
-H2("Links");
-echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/",
- "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/",
- "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/",
- "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/",
- "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/",
- "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/",
- "HTDig");
-LILI("http://jakarta.apache.org/lucene/",
- "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/",
- "Swish++");
-LILI("http://webglimpse.net/",
- "Glimpse");
-LILI("http://evidence.sf.net/",
- "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html",
- "Article about doodle (and other things) in the German Linux-Magazin");
-echo "</ul>";
HR();
-echo "<address><a href=\"mailto:address@hidden\">Christian Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
- "Verbatim copying and distribution of this entire article\n" .
- "is permitted in any medium, provided this notice is preserved.");
-BR();
generateFooter();
echo "</body></html>\n";
?>
[Prev in Thread] |
Current Thread |
[Next in Thread] |
- [GNUnet-SVN] r648 - Extractor-docs/WWW GNUnet-docs/WWW i18nHTML-docs/WWW i18nHTML-docs/WWW/download,
grothoff <=