gnunet-svn
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

[GNUnet-SVN] r648 - Extractor-docs/WWW GNUnet-docs/WWW i18nHTML-docs/WWW


From: grothoff
Subject: [GNUnet-SVN] r648 - Extractor-docs/WWW GNUnet-docs/WWW i18nHTML-docs/WWW i18nHTML-docs/WWW/download
Date: Sun, 10 Apr 2005 23:58:58 -0700 (PDT)

Author: grothoff
Date: 2005-04-10 23:58:51 -0700 (Sun, 10 Apr 2005)
New Revision: 648

Added:
   i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
   i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
Modified:
   Extractor-docs/WWW/index.php
   GNUnet-docs/WWW/index.php
   i18nHTML-docs/WWW/index.php
Log:
revert

Modified: Extractor-docs/WWW/index.php
===================================================================
--- Extractor-docs/WWW/index.php        2005-04-11 06:52:55 UTC (rev 647)
+++ Extractor-docs/WWW/index.php        2005-04-11 06:58:51 UTC (rev 648)
@@ -1,199 +1,108 @@
 <?php
-include("i18nhtml.inc");
-DOCTYPE("HTML", "Transitional");
-echo "<html><head>\n";
-if ($title) {
-  echo "<title>";
-  TRANSLATE("Doodle: find information on your computer");
-  echo "</title>";
- }
-if ($description) {
-  echo "<meta name=\"description\" content=\"";
-  TRANSLATE("A tool to index and search the files on your disk.");
-  echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
-?>
-<meta name="author" content="Christian Grothoff">
-<meta name="keywords" 
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
-<meta name="robots" content="index,follow">
-<meta name="revisit-after" content="28 days">
-<meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
-<meta http-equiv="expires" content="43200">
-<meta http-equiv="content-type" content="text/html">
-</head>
-<body>
-<?php
-generateLanguageBar();
+$title="libextractor - a simple library for keyword extraction";
+$description="a simple library for keyword extraction";
+$email="address@hidden";       
+$keywords="keyword, extraction, mp3, html, pdf, images, jpeg, gif, ps, mime, 
real, qt, asf, mpeg, avi, riff, tiff, summary, summaries, kbps, format, 
mime-type, zip, elf, doc, ppt, xls, sha-1, md5, open office, sxw, dvi, id3, 
id3v2, id3v2.3, id3v2.4, thumbnails";
+$author="Vids Samanta and Christian Grothoff"; 
+$page="home";  
+include("html_header.php3");
 
-H1("Doodle");
 ANCHOR("about");
-H2("About");
+H2("About libextractor");
 
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and 
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
-  extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
-  extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
-  extlink_("#links", "links"));
-
+IMG("extractor_logo.png", "libextractor", "right", "136", "94", "0");
 P();
-W("Doodle is licensed under the %s.",
-  extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on 
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
-  ARRAY(extlink_("http://www.debian.org/", "Debian"),
-        extlink_("http://www.redhat.com/", "RedHat"),
-        extlink_("http://www.gnu.org/", "GNU"),
-        extlink_("http://www.linux.org/", "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
-  extlink_("/libextractor/", "libextractor"));
-P();
+W("libextractor is a library used to extract meta-data from files of arbitrary 
type.");
+W("It is designed to use helper-libraries to perform the actual extraction, 
and to be trivially extendable by linking against external extractors for 
additional file types.");
+W("libextractor is part of the %s.",
+  extlink_("http://www.gnu.org/", "GNU project"));
+//W("Our official GNU website can be found at %s.",
+//  extlink_("http://www.gnu.org/software/libextractor/","http://www.gnu.org/software/libextractor/"));
+W("libextractor can be downloaded from this site or the %s.",
+  extlink_("http://www.gnu.org/prep/ftp.html","GNU mirrors"));
 
-ANCHOR("download");
-H2("Download");
-W("You can find the current release %s.",
-  extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
-  ARRAY(extlink_("man/doodle.html", "doodle"),
-        extlink_("man/doodled.html", "doodled"),
-        extlink_("man/libdoodle", "libdoodle")));
-
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/");
-P();    
-W("If you want to be notified about updates, subscribe to %s",
-  extlink_("http://freshmeat.net/projects/doodle/", "doodle on freshmeat"));
 P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
-  extlink_("http://packages.debian.org/doodle", "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
-  extlink_("http://dag.wieers.com/packages/doodle/","here"));
+W("The goal is to provide developers of file-sharing networks or WWW-indexing 
bots with a universal library to obtain simple keywords to match against 
queries.");
+W("libextractor contains a shell-command &quot;extract&quot; that, similar to 
the well-known &quot;file&quot; command, can extract meta-data from a file an 
print the results to stdout.");
 P();
 
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the 
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
+W("Currently, libextractor supports the following formats:");
+include("plugins_list");
 BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either 
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled, 
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates 
the doodle database.",
-  "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments 
that you would pass to doodle to construct the database, but without the 
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until 
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b 
/</tt>), it is typically not a great idea to have doodled monitor your entire 
system for changes -- especially since <tt>/usr</tt> is unlikely to change 
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using 
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
-    "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory 
will be always up-to-date.");
+W("Also, various additional MIME types are detected.");
 P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
-  extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to 
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for 
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown 
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index 
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!) 
result in doodle re-indexing files that were processed with other options 
previously.");
-W("The only way to force doodle to re-index files with different options is to 
either touch the files (change modification timestamp) or to delete the old 
database and start from scratch.");
 
+W("libextractor is free software; you can redistribute it and/or modify it 
under the terms of the GNU General Public License as published by the Free 
Software Foundation; either version 2 of the License, or (at your option) any 
later version.");
+ANCHOR("news");
+H2("Recent News");
 P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the 
entire system periodically (cron job) and have doodled monitor the home 
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable 
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll 
the database.");
-W("Doodle will ensure that information about files not accessible to the user 
are not leaked by checking if files found in the database are accessible to the 
user.");
-W("doodled has to run as root since otherwise it would be impossible to index 
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files 
readable to the user that runs doodled.");
-
-
+echo "<dl>";
+DTDD("Thu Feb 24 01:23:31 EST 2005 | libextractor v0.4.2 released.",
+     "This release fixes some bugs in the ID3, PDF, PNG and REAL extractors.  
The REAL extractor now also handles the new Helix formats.  libextractor can 
now also be used to extract thumbnails from images (using ImageMagick).");
+DTDD("Wed Jan 26 19:51:44 EST 2005 | libextractor v0.4.1 released.",
+     "This release fixes a security issue (inherited from xpdf).  It also 
extracts more meta-data from files of TAR or QuickTime format.");
+DTDD("Sat Dec 25 21:42:26 CET 2004 | libextractor v0.4.0 released.",
+     "This release improves support for character sets (plugins are now 
expected to convert to UTF-8).  It also improves support for mp3 (adding 
genres) and png (handling of compressed comments).");
+DTDD("Sat Nov 13 13:23:23 EST 2004 | libextractor v0.3.11 released.",
+     "This release fixes bugs in the dvi, man, ID3v2.3, ole2 and pdf 
extractors.");
+DTDD("Sun Oct 18 13:23:35 EST 2004 | libextractor v0.3.10 released.", 
+     "This release adds support for ID3v2.3 and ID3v2.4.  It fixes bugs in the 
tar, man, deb, mp3 and ole2 extractors.");
+DTDD("Sat Oct 17 18:12:11 EST 2004 | libextractor v0.3.9 released.", 
+     "This release adds support for the man, tar (including tar.gz) and deb 
formats.  It fixes bugs in the id3v2 and jpeg extractors.  The size of jpeg 
images is now also extracted.  This version adds support for 64-bit file 
sizes.");
+DTDD("Sat Oct 02 20:00:04 EST 2004 | libextractor v0.3.8 released.",
+ "This release adds support for dvi (from TeX).  The plugins are now installed 
in a separate plugin directory.  libextractor now works under OS X (10.3)."); 
+DTDD("Fri Sep 23 23:30:33 EST 2004 | libextractor v0.3.7 released.",
+     "This release adds support for StarOffice formats, ID3v2 tags and the 
Ripe160MD hash function.  It also improves the performance of the HTML and ZIP 
extractors.");
+DTDD("Fri Sep 10 20:10:38 EST 2004 | libextractor v0.3.6 released.",
+     "This release adds support for OpenOffice formats, hash functions (md5, 
sha-1) and fixes some build problems.");
+DTDD("Mon Aug 30 23:18:49 IST 2004 | libextractor v0.3.5 released.",
+     "This release adds support for OLE2 (WinWord, PowerPoint, Excel formats) 
and fixes various minor bugs.  For OLE2 support you will have to have glib 2.0 
installed (yes, that is glib from GTK/Gnome, not glibc!).");
+DTDD("Thu Aug 26 20:27:24 IST 2004 | Bugtracking using Mantis enabled.",
+     "You can now report and view bug-reports about libextractor on %s.",
+     extlink_("https://gnunet.org/mantis/","Mantis"));
+DTDD("Wed Aug 25 19:02:07 IST 2004 | libextractor v0.3.4 released.",
+     "This release fixes a minor linking error (<tt>-lm</tt> for 
<tt>floor</tt>), improves performance and adds support for GNU gettext 
(internationalization).");
+DTDD("Wed May 31 19:22:07 EST 2004 | libextractor v0.3.3 released.",
+     "This release fixes various minor bugs (segmentation faults and 
non-termination of mpeg and riff extractors for malformed files) and adds 
support for WAV files.");
+DTDD("Wed May 31 19:22:07 EST 2004 | libextractor v0.3.2 released.",
+     "This release fixes various minor bugs (plugins misbehaving for malformed 
files) and improves portability to Cygwin/MinGW.");
+echo "</dl>";
 P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of 
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
-    "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n" 
.
-    "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in 
one run (see %s for option <tt>-d</tt>).",
-  extlink_("man/doodle.html", "doodle"));
+W("%s",
+  intlink_("oldnews","Older news archive"));
 
-P();
-ANCHOR("mantis");
-H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
-W("Visit %s to report bugs.",
-  extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/"));
-W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not 
under any of the other projects.");
-P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
-  extlink_("mailto:address@hidden","address@hidden"));
-
-
 ANCHOR("links");
 H2("Links");
+P();
+W("Related work:");
 echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/", 
-     "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/", 
-     "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/",
-     "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/",
-     "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/",
-     "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/",
-     "HTDig");
-LILI("http://jakarta.apache.org/lucene/",
-     "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/",
-     "Swish++");
-LILI("http://webglimpse.net/",
-     "Glimpse");
-LILI("http://evidence.sf.net/",
-     "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html",
-     "Article about doodle (and other things) in the German Linux-Magazin");
+LILI("http://www.wotsit.org","File format database");
+LILI("http://getid3.sf.net/","getid3, similar project for PHP");
+LILI("download/php/",
+     "PHP wrapper for libextractor (mirrored, not written by us, see README)");
+LILI("http://dublincore.org/documents/dcmi-terms/","Meta-data categorization 
standard");
+LILI("http://hul.harvard.edu/jhove/","JHOVE, Harvard Object Validation 
Environment");
 echo "</ul>";
-HR();
-echo "<address><a href=\"mailto:address@hidden\">Christian Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
-    "Verbatim copying and distribution of this entire article\n" .
-    "is permitted in any medium, provided this notice is preserved.");
-BR();
-generateFooter();
-echo "</body></html>\n";
+W("Projects that use libextractor:");
+echo "<ul>";
+LILI("http://witme.sourceforge.net/libferris.web/","libferris, a virtual file 
system");
+LILI("http://evidence.sf.net/","Evidence, enlightened file manager");
+LILI("http://gnunet.org/","GNUnet, secure P2P file sharing");
+LILI("http://gnunet.org/doodle/","doodle, index your disk");
+echo "</ul>";
+
+ANCHOR("contact");
+H2("Contact");
+P();
+W("libextractor is developed by %s and %s.",
+  ARRAY(extlink_("http://grothoff.org/christian/",
+                "Christian Grothoff"),
+       extlink_("http://compilers.cs.purdue.edu/~vids/",
+                "Vids Samanta")));
+W("For questions about libextractor send email to %s.",
+  extlink_("mailto:address@hidden",
+          "address@hidden"));
+
+include("html_footer.php3");
 ?>
+

Modified: GNUnet-docs/WWW/index.php
===================================================================
--- GNUnet-docs/WWW/index.php   2005-04-11 06:52:55 UTC (rev 647)
+++ GNUnet-docs/WWW/index.php   2005-04-11 06:58:51 UTC (rev 648)
@@ -1,199 +1,83 @@
 <?php
-include("i18nhtml.inc");
-DOCTYPE("HTML", "Transitional");
-echo "<html><head>\n";
-if ($title) {
-  echo "<title>";
-  TRANSLATE("Doodle: find information on your computer");
-  echo "</title>";
- }
-if ($description) {
-  echo "<meta name=\"description\" content=\"";
-  TRANSLATE("A tool to index and search the files on your disk.");
-  echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
-?>
-<meta name="author" content="Christian Grothoff">
-<meta name="keywords" 
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
-<meta name="robots" content="index,follow">
-<meta name="revisit-after" content="28 days">
-<meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
-<meta http-equiv="expires" content="43200">
-<meta http-equiv="content-type" content="text/html">
-</head>
-<body>
-<?php
-generateLanguageBar();
+include("scripts.php3");
+$title = "GNUnet";
+$description="GNUnet - an anonymous distributed backup system :-)";
+include("html_header.php3");
 
-H1("Doodle");
-ANCHOR("about");
-H2("About");
+H2("About GNUnet");
+gnunetlogo();
 
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and 
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
-  extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
-  extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
-  extlink_("#links", "links"));
-
+W("GNUnet is a framework for secure peer-to-peer networking that does not use 
any centralized or otherwise trusted services.");
+W("A first service implemented on top of the networking layer allows anonymous 
censorship-resistant file-sharing.");
+W("GNUnet uses a simple, excess-based economic model to allocate resources.");
+W("Peers in GNUnet monitor each others behavior with respect to resource 
usage; peers that contribute to the network are rewarded with better service.");
 P();
-W("Doodle is licensed under the %s.",
-  extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on 
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
-  ARRAY(extlink_("http://www.debian.org/", "Debian"),
-        extlink_("http://www.redhat.com/", "RedHat"),
-        extlink_("http://www.gnu.org/", "GNU"),
-        extlink_("http://www.linux.org/", "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
-  extlink_("/libextractor/", "libextractor"));
-P();
 
-ANCHOR("download");
-H2("Download");
-W("You can find the current release %s.",
-  extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
-  ARRAY(extlink_("man/doodle.html", "doodle"),
-        extlink_("man/doodled.html", "doodled"),
-        extlink_("man/libdoodle", "libdoodle")));
+W("GNUnet is part of the %s.",
+  extlink_("http://www.gnu.org/","GNU project"));
+W("Our official GNU website can be found at %s.",
+  extlink_("http://www.gnu.org/software/gnunet/","http://www.gnu.org/software/gnunet/"));
+W("GNUnet can be downloaded from this site or the %s.",
+  extlink_("http://www.gnu.org/prep/ftp.html","GNU mirrors"));
 
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/");
-P();    
-W("If you want to be notified about updates, subscribe to %s",
-  extlink_("http://freshmeat.net/projects/doodle/", "doodle on freshmeat"));
 P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
-  extlink_("http://packages.debian.org/doodle", "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
-  extlink_("http://dag.wieers.com/packages/doodle/","here"));
-P();
+H2("News");
+W("Older news can be found %s.\n",
+  intlink_("old_news.php3", "here"));
+echo "<dl>\n";
 
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the 
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
-BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either 
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled, 
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates 
the doodle database.",
-  "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments 
that you would pass to doodle to construct the database, but without the 
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until 
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b 
/</tt>), it is typically not a great idea to have doodled monitor your entire 
system for changes -- especially since <tt>/usr</tt> is unlikely to change 
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using 
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
-    "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory 
will be always up-to-date.");
-P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
-  extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to 
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for 
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown 
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index 
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!) 
result in doodle re-indexing files that were processed with other options 
previously.");
-W("The only way to force doodle to re-index files with different options is to 
either touch the files (change modification timestamp) or to delete the old 
database and start from scratch.");
+function convert_time($mysql_timestamp){
+if (ereg("^([0-9]{4})([0-9]{2})([0-9]{2})([0-9]{2})" .
+           "([0-9]{2})([0-9]{2})",$mysql_timestamp,$res)):
+  $year=$res[1];
+  $month=$res[2];
+  $day=$res[3];
+  $hour=$res[4];
+  $min=$res[5];
+  $sec=$res[6];
 
-P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the 
entire system periodically (cron job) and have doodled monitor the home 
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable 
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll 
the database.");
-W("Doodle will ensure that information about files not accessible to the user 
are not leaked by checking if files found in the database are accessible to the 
user.");
-W("doodled has to run as root since otherwise it would be impossible to index 
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files 
readable to the user that runs doodled.");
+ return(array($year,$month,$day,$hour,$min,$sec));
+  else:
+     return(false);
+ endif;
+}
 
-
+// definition: news is what is less than 3 months old :-)
+$query = "SELECT title,include,posted FROM news " .
+   "WHERE TO_DAYS(NOW())-TO_DAYS(posted) < 90 " .
+   "ORDER BY posted DESC";
+$result = mysql_query($query, $connection);
+$num = 0;
+if ($result) {
+  $num = mysql_numrows($result);
+}
+for ($i=0;$i<$num;$i++) {
+  $row = mysql_fetch_array($result);
+  $pd = convert_time($row["posted"]);
+  echo "<dt>" . $pd[0] . "-" . $pd[1] . "-" . $pd[2] .  ": " . 
W_($row["title"]) . "</dt>\n";
+  echo "<dd>\n";
+  include($row["include"]);
+  echo "</dd>\n";
+}
+echo "</dl>\n";
 P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of 
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
-    "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n" 
.
-    "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in 
one run (see %s for option <tt>-d</tt>).",
-  extlink_("man/doodle.html", "doodle"));
-
+H2("Roadmap");
+W("Here is the current development plan:");
+echo "<ul>\n";
+LI("fix %s",
+   extlink_("https://gnunet.org/mantis/","bugs"));
+LI("improve handling of pseudonyms (manage reputation in namespaces)");
+LI("add testbed harness to allow automated testing and profiling (%s)",
+   extlink_("mailto:address@hidden","contact"));
+LI("extend GTK UI (delete, statistics, configuration, recursive insertion)");
+LI("add download-daemon that manages ongoing/completed/stalled downloads");
+echo "</ul>\n";
 P();
-ANCHOR("mantis");
-H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
-W("Visit %s to report bugs.",
-  extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/"));
-W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not 
under any of the other projects.");
-P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
-  extlink_("mailto:address@hidden","address@hidden"));
+H2("Contact");
+W("GNUnet is developed by %s.",
+  extlink_("http://www.gnu.org/software/gnunet/","the GNUnet developers"));
+W("For questions about GNUnet send E-Mail to %s.",
+  extlink_("mailto:address@hidden","address@hidden"));
 
-
-ANCHOR("links");
-H2("Links");
-echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/", 
-     "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/", 
-     "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/",
-     "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/",
-     "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/",
-     "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/",
-     "HTDig");
-LILI("http://jakarta.apache.org/lucene/",
-     "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/",
-     "Swish++");
-LILI("http://webglimpse.net/",
-     "Glimpse");
-LILI("http://evidence.sf.net/",
-     "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html",
-     "Article about doodle (and other things) in the German Linux-Magazin");
-echo "</ul>";
-HR();
-echo "<address><a href=\"mailto:address@hidden\">Christian Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
-    "Verbatim copying and distribution of this entire article\n" .
-    "is permitted in any medium, provided this notice is preserved.");
-BR();
-generateFooter();
-echo "</body></html>\n";
+include("html_footer.php3");
 ?>

Added: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
===================================================================
(Binary files differ)


Property changes on: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.bz2
___________________________________________________________________
Name: svn:mime-type
   + application/octet-stream

Added: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
===================================================================
(Binary files differ)


Property changes on: i18nHTML-docs/WWW/download/i18nHTML-0.2.0.tar.gz
___________________________________________________________________
Name: svn:mime-type
   + application/octet-stream

Modified: i18nHTML-docs/WWW/index.php
===================================================================
--- i18nHTML-docs/WWW/index.php 2005-04-11 06:52:55 UTC (rev 647)
+++ i18nHTML-docs/WWW/index.php 2005-04-11 06:58:51 UTC (rev 648)
@@ -2,198 +2,84 @@
 include("i18nhtml.inc");
 DOCTYPE("HTML", "Transitional");
 echo "<html><head>\n";
-if ($title) {
-  echo "<title>";
-  TRANSLATE("Doodle: find information on your computer");
-  echo "</title>";
- }
-if ($description) {
-  echo "<meta name=\"description\" content=\"";
-  TRANSLATE("A tool to index and search the files on your disk.");
-  echo "\">";
- }
-echo "<meta name=\"content-language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
-echo "<meta name=\"language\" content=\"" . 
-     $languagecodes[$lang] . "\">";
+TITLE("i18nHTML - enabling collaborative webpage translation");
+echo "<meta name=\"description\" content=\"";
+TRANSLATE("i18nHTML is a collection of PHP scripts that allow visitors of a 
webpage to help translating it.");
+echo "\">";
 ?>
 <meta name="author" content="Christian Grothoff">
-<meta name="keywords" 
content="doodle,desktop,search,suffix,tree,meta,data,libextractor,keywords,fam,index,database,free,Linux,GNU,GPL">
+<meta name="keywords" 
content="i18n,HTML,PHP,translation,languages,mysql,database,internationalization,www,free,GNU,GPL">
 <meta name="robots" content="index,follow">
 <meta name="revisit-after" content="28 days">
 <meta name="publisher" content="Christian Grothoff">
-<meta name="date" content="2004-12-31">
-<meta name="rights" content="(C) 2004 by Christian Grothoff>";
+<meta name="date" content="2005-01-03">
+<meta name="rights" content="(C) 2004,2005 by Christian Grothoff>";
 <meta http-equiv="expires" content="43200">
 <meta http-equiv="content-type" content="text/html">
 </head>
 <body>
 <?php
 generateLanguageBar();
-
-H1("Doodle");
-ANCHOR("about");
+H1("i18nHTML");
 H2("About");
-
-W("Doodle is a tool to quickly search the documents on a computer.");
-W("Doodle builds an index using meta-data contained in the documents and 
allows fast searches on the resulting database.");
-W("Doodle uses %s to support obtaining meta-data from various file-formats.",
-  extlink_("/libextractor/","libextractor"));
-W("The database used by doodle is a %s, resulting in fast lookups.",
-  extlink_("http://www.nist.gov/dads/HTML/suffixtree.html","suffix tree"));
-W("Doodle supports approximate searches.");
-BR();
-W("Features that Doodle does not have at the moment include:");
-echo "<ul>";
-LI("A web interface");
-LI("Ordering of search results");
-LI("Spidering (indexing the Internet or websites)");
-echo "</ul>";
-W("If you need these features, have a look at the %s section.",
-  extlink_("#links", "links"));
-
+W("i18nHTML is a collection of PHP files that can be used to write webpages 
that visitors can translate into their respective native languages.");
+W("i18nHTML uses a database to match sentences from the webpage against 
translations.");
+W("i18nHTML defines a set of PHP functions that generate either the translated 
HTML sentences or the original (typically English) text with decorations that 
allow users to provide translations.");
+W("i18nHTML requires the internationalized webpages to be written using the 
provided PHP functions but does not constrain the page design in any way.");
+W("Webpages internationalized with i18nHTML can be updated without loosing 
existing translations for sentences that were not changed.");
+W("Note that it is important that you use the i18nHTML <tt>TITLE</tt> command 
in your documents in order to ensure that the character set and other meta-data 
is set properly.");
 P();
-W("Doodle is licensed under the %s.",
-  extlink_("http://www.gnu.org/licenses/gpl.html","GNU GPL"));
-W("Indexing large volumes can take several hundred MBs of memory (depending on 
the amount of meta-data found).");
-W("Searching should nevertheless require almost no memory.");
-W("Using the latest version of libextractor is recommended.");
-W("Doodle has so far only been tested under %s and %s %s %s.",
-  ARRAY(extlink_("http://www.debian.org/", "Debian"),
-        extlink_("http://www.redhat.com/", "RedHat"),
-        extlink_("http://www.gnu.org/", "GNU"),
-        extlink_("http://www.linux.org/", "Linux")));
-W("Doodle is expected it to work under any platform supported by %s.",
-  extlink_("/libextractor/", "libextractor"));
+H2("News");
+H3("i18nHTML 0.1.0 released");
+W("i18nHTML 0.1.0 is expected to solve various character set encoding 
issues.");
+W("It also ensures that all entered translations match the original sentence 
in the number of escape sequences.");
+W("The new version also resolves various minor bugs (such as editor mode only 
working with php-register-globals enabled).");
 P();
-
-ANCHOR("download");
+W("Upgrading from i18nHTML 0.0.2 to 0.1.0 requires changes to the encoding of 
strings in the database (which is now hopefully properly based on unicode).");
+W("This can be done by running the update.php script and feeding the SQL 
statements that update.php generates into MySQL.");
+W("Running <tt>update.php</tt> by itself will not do the data conversion (for 
security reasons).");
+W("You should backup your old translation database first.");
+W("mysqldump should be useful here.");
+W("Note that <tt>update.php</tt> may discard translations that it believes 
have serious character set (or other) problems.");
+W("The total number of discarded translations can be found at the end of the 
output (in a generated comment).");
+P();
+W("Another important step in upgrading from 0.0.2 to 0.1.0 is to use the new 
<tt>TITLE</tt> function to generate the title of all webpages.");
+W("The reason is that the <tt>TITLE</tt> function will generate other HTML 
tags that should be placed in the HTML header to help ensure that the browser 
picks up the character encodings correctly.");
+P();
 H2("Download");
-W("You can find the current release %s.",
-  extlink_("download/doodle-0.6.2.tar.gz", "here"));
-W("Man-pages for %s, %s and %s are also on-line.",
-  ARRAY(extlink_("man/doodle.html", "doodle"),
-        extlink_("man/doodled.html", "doodled"),
-        extlink_("man/libdoodle", "libdoodle")));
-
-W("The latest version can be obtained using");
-PRE("$ svn checkout https://gnunet.org/svn/doodle/");
+W("You can find the latest version %s.",
+  extlink_("https://gnunet.org/i18nHTML/download/", "here"));
+W("The latest SVN version can be obtained using");
+PRE("$ svn checkout https://gnunet.org/svn/i18nHTML/");
 P();    
 W("If you want to be notified about updates, subscribe to %s",
-  extlink_("http://freshmeat.net/projects/doodle/", "doodle on freshmeat"));
+  extlink_("http://freshmeat.net/projects/i18nHTML/", "i18nHTML on freshmeat"));
 P();
-W("Debian packages provided by Daniel Baumann can be found %s.",
-  extlink_("http://packages.debian.org/doodle", "here"));
-W("RedHat/Fedora RPM packages provided by Dag Wieers can be found %s.",
-  extlink_("http://dag.wieers.com/packages/doodle/","here"));
-P();
 
-ANCHOR("using");
-H2("Using doodle");
-W("First the doodle database needs to be created.");
-W("The simplest way to create the database is to run doodle with the 
<tt>-b</tt> option on the directories that are to be indexed.");
-W("For example:");
-PRE("$ doodle -b $HOME");
-W("This will create the doodle database under <tt>~/.doodle</tt>.");
-BR();
-W("After creating the doodle database, you can search it.");
-W("For example:");
-PRE("$ doodle keyword");
-BR();
-H3("Keeping the database up-to-date");
-W("If you want to keep your doodle database up-to-date, you can either 
periodically re-run doodle with the <tt>-b</tt> option, or you can use doodled, 
the doodle daemon.");
-W("doodled uses %s to notice whenever a file is changed and instantly updates 
the doodle database.",
-  "fam");
-W("In order to use doodled, you must have famd running.");
-W("If famd is running, you can start doodled by passing the same arguments 
that you would pass to doodle to construct the database, but without the 
<tt>-b</tt> option:");
-PRE("$ doodled $HOME");
-W("You can also use doodled to construct the initial database.");
-W("While doodled is updating the database, any doodle search will block until 
the update is complete.");
-W("Note that while you may want to index your entire disk (i.e., <tt>doodle -b 
/</tt>), it is typically not a great idea to have doodled monitor your entire 
system for changes -- especially since <tt>/usr</tt> is unlikely to change 
frequently.");
-W("You can address this issue by first indexing <tt>/</tt> and then using 
doodled to monitor only directories that change frequently:");
-PRE("$ doodle -b /\n" .
-    "$ doodled $HOME");
-W("This way, your entire system will be in the index, and your home directory 
will be always up-to-date.");
-P();
-H3("Full-text search");
-W("You can achieve a (limited) form of full-text search with doodle.");
-W("For that, the dictionary-based plaintext extractors from %s are used.",
-  extlink_("/libextractor/","libextractor"));
-W("In order to use them, you need to pass the option <tt>-b LANG</tt> to 
doodle.");
-W("LANG is a two letter language code that selects the dictionary.");
-W("Available languages at the moment are en, es, fr, it and no.");
-W("Words and sentences that are available in the respective dictionaries for 
these languages will then be added to the index.");
-W("While libextractor attempts to avoid full-text extraction for certain kown 
binary formats, it may still find words in non-text files.");
-W("Running with this option will dramatically increase the size of the index 
and the time it takes to build the index.");
-W("Note that if you change the options used to build a database will not (!) 
result in doodle re-indexing files that were processed with other options 
previously.");
-W("The only way to force doodle to re-index files with different options is to 
either touch the files (change modification timestamp) or to delete the old 
database and start from scratch.");
 
-P();
-H3("Hints for system administrators");
-W("If you are the system administrator, you might want to run doodle on the 
entire system periodically (cron job) and have doodled monitor the home 
directories in the background.");
-W("In that case, it is suggested to have the doodle database be group-readable 
for a group doodle.");
-W("Set the permissions for the doodle binary to SGID to allow users to poll 
the database.");
-W("Doodle will ensure that information about files not accessible to the user 
are not leaked by checking if files found in the database are accessible to the 
user.");
-W("doodled has to run as root since otherwise it would be impossible to index 
the personal files of all users.");
-W("If that it too risky, doodled will still work, but only index the files 
readable to the user that runs doodled.");
 
-
 P();
-H3("Using different options for different directories");
-W("You can build a database from multiple doodle runs over distinct sets of 
files with different options.");
-W("For example, the following can make sense:");
-PRE("$ doodle -B en -b /usr/share/doc # full-text index over documentation\n" .
-    "$ doodle -b /usr /opt /bin /lib # normal index over other system files\n" 
.
-    "$ doodled -B en /home # monitor /home, with full-text support\n");
-W("A simple doodle search will then find files in all listed directories.");
-W("You can also build multiple disjoint databases and search all of them in 
one run (see %s for option <tt>-d</tt>).",
-  extlink_("man/doodle.html", "doodle"));
+if ( ($xlang) && ($xlang != "English")) {
+  H2("Mass translation");
+  W("The mass-translation page for translating many sentences at once is %s.",
+    intlink_("editor.php", "here"));
+  W("Note that the sentence database is shared with the %s, %s and %s 
projects.",
+    ARRAY(extlink_("http://gnunet.org/", "GNUnet"),
+         extlink_("http://gnunet.org/doodle/", "doodle"),
+         extlink_("http://gnunet.org/libextractor/", "libExtractor")));  
+ }
 
-P();
-ANCHOR("mantis");
 H2("Bugtrack");
-W("Doodle uses Mantis for bugtracking.");
+W("i18nHTML uses Mantis for bugtracking.");
 W("Visit %s to report bugs.",
  extlink_("https://gnunet.org/mantis/","https://gnunet.org/mantis/"));
 W("You need to sign up for a reporter account.");
-W("Please make sure you report bugs under <strong>Doodle</strong> and not 
under any of the other projects.");
+W("Please make sure you report bugs under <strong>I18nHTML</strong> and not 
under any of the other projects.");
 P();
-W("If you dislike Mantis and need to report a bug contact %s via e-mail.",
+W("If you dislike Mantis and need to report a bug contact %s via e-mail (good 
luck getting by the spam-filter).",
  extlink_("mailto:address@hidden","address@hidden"));
 
-
-ANCHOR("links");
-H2("Links");
-echo "<ul>";
-LILI("http://members.cox.net/sinzui/medusa/", 
-     "Medusa, similar project for Gnome");
-LILI("http://swish-e.org/", 
-     "Swish-e, indexing tool with focus on the WWW");
-LILI("http://www.gnome.org/~seth/storage/",
-     "GNOME Storage");
-LILI("http://www.gnome.org/projects/beagle/",
-     "Beagle");
-LILI("http://sourceforge.net/projects/rlocate/",
-     "rlocate, version of locate that is always up-to-date");
-LILI("http://www.htdig.org/",
-     "HTDig");
-LILI("http://jakarta.apache.org/lucene/",
-     "Lucene");
-LILI("http://homepage.mac.com/pauljlucas/software/swish/",
-     "Swish++");
-LILI("http://webglimpse.net/",
-     "Glimpse");
-LILI("http://evidence.sf.net/",
-     "Evidence, file-manager with support for doodle");
-LILI("http://www.linux-magazin.de/Artikel/ausgabe/2004/09/bgw/bgw.html",
-     "Article about doodle (and other things) in the German Linux-Magazin");
-echo "</ul>";
 HR();
-echo "<address><a href=\"mailto:address@hidden\">Christian Grothoff</a></address>";
-PRE("Copyright (C) 2004 Christian Grothoff.\n" .
-    "Verbatim copying and distribution of this entire article\n" .
-    "is permitted in any medium, provided this notice is preserved.");
-BR();
 generateFooter();
 echo "</body></html>\n";
 ?>





reply via email to

[Prev in Thread] Current Thread [Next in Thread]