Subject: mailing-list for TeXmacs Users
List archive
From : "Zoltán Kovács" <address@hidden>- To: address@hidden
- Subject: Re: [TeXmacs] Re: frenchspacing?
- Date: Wed, 7 Nov 2007 09:42:10 +0100
- Domainkey-signature: a=rsa-sha1; c=nofws; d=gmail.com; s=beta; h=received:message-id:date:from:to:subject:in-reply-to:mime-version:content-type:references; b=KU6MiJzVajC8XXuiyzl/tqbht+YooPD35g9QiXk9VuADwXchQOzz8HkGHlpi585af5233Z6sX1UbJTa47g3gAQ2t52Op+pP0h12hnvkaexFpmkX+eSMmNzpsp5pQzLDwA9X5utN2la3zgaOG+IMrANqHougaVeO5PsTHIFEsfN8=
Hi, I'm not sure it really works. It seems that it isn't. However, I can send you the modified file in the attachment.
Best regards, Zoltan
2007/11/7,
address@hidden <address@hidden>:
Hi, coiuld you post the changes you made
thank you
Le mardi 06 novembre 2007 à 18:01 +0100, Zoltán Kovács a écrit :
Dear Joris,
thank you for the help! I made just a short fix for my need, changing only the text_language part, but currently it is OK for me. (Clearly, I cannot contribute an enhancement for TeXmacs now, but I'm in a hurry now... ;-)
Best regards, Zoltan
2007/10/30, Joris van der Hoeven <address@hidden>:
Hi Zoltan,
On Mon, Oct 29, 2007 at 09:38:56PM +0100, Zoltán Kovács wrote:
> Dear All, I resend this question. Frenchspacing means that no double spaces
> are put after sentences, only one space. I found nothing about this in
> Google.
I did not have time yet to do this.
However, if you know a bit about C++ and have a few hours,
then it is quite easy to add this yourself.
Take a look at
src/Resources/Languages/text_language.cpp
The idea would be to copy the text_language_rep class and
make a second french_language_rep class with the correct
amounts of space evrywhere. I recommend to check in an official
book about french typography: there are also half spaces and
three quarters of a space for certain ponctuation symbols.
The same procedure applies to other languages.
Best wishes, Joris
--
matek.hu --- mert matekból érettségizni mindenkinek kell...
--
matek.hu --- mert matekból érettségizni mindenkinek kell...
/******************************************************************************
* MODULE : text_language.cpp
* DESCRIPTION: natural textual languages
* COPYRIGHT : (C) 1999 Joris van der Hoeven
*******************************************************************************
* This software falls under the GNU general public license and comes WITHOUT
* ANY WARRANTY WHATSOEVER. See the file $TEXMACS_PATH/LICENSE for more details.
* If you don't have this file, write to the Free Software Foundation, Inc.,
* 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
******************************************************************************/
#include "analyze.hpp"
#include "language.hpp"
#include "Languages/hyphenate.hpp"
#include "Languages/impl_language.hpp"
#include "sys_utils.hpp"
/******************************************************************************
* Western text languages
******************************************************************************/
struct text_language_rep: language_rep {
hashmap<string,string> H;
text_language_rep (string lan_name, string hyph_name);
text_property advance (string s, int& pos);
array<int> get_hyphens (string s);
void hyphenate (string s, int after, string& left, string& right);
};
text_language_rep::text_language_rep (string lan_name, string hyph_name):
language_rep (lan_name), H (load_hyphen_table (hyph_name)) {}
text_property
text_language_rep::advance (string s, int& pos) {
if (pos == N(s)) return &tp_normal_rep;
if (s[pos]==' ') {
pos++;
// while ((pos<N(s)) && (s[pos]==' ')) pos++;
if ((pos == N(s)) || (!is_punctuation (s[pos])))
return &tp_space_rep;
return &tp_blank_rep;
}
if (is_punctuation (s[pos])) {
while ((pos<N(s)) && is_punctuation (s[pos])) pos++;
if ((pos==N(s)) || (s[pos]!=' ')) return &tp_normal_rep;
switch (s[pos-1]) {
case ',': case ':': case ';': case '`': case '\'': case '.': case '!': case '?':
return &tp_space_rep;
// case '.': case '!': case '?':
// return &tp_period_rep;
}
return &tp_space_rep;
}
if (s[pos]=='-') {
pos++;
while ((pos<N(s)) && (s[pos]=='-')) pos++;
return &tp_hyph_rep;
}
if (is_iso_alpha (s[pos])) {
while ((pos<N(s)) && is_iso_alpha (s[pos])) pos++;
return &tp_normal_rep;
}
if (is_numeric (s[pos])) { // can not be a '.'
while ((pos<N(s)) && is_numeric (s[pos])) pos++;
while (s[pos-1]=='.') pos--;
return &tp_normal_rep;
}
if (s[pos]=='<') {
while ((pos<N(s)) && (s[pos]!='>')) pos++;
if (pos<N(s)) pos++;
return &tp_normal_rep;
}
pos++;
return &tp_normal_rep;
}
array<int>
text_language_rep::get_hyphens (string s) {
return ::get_hyphens (s, H);
}
void
text_language_rep::hyphenate (
string s, int after, string& left, string& right)
{
array<int> penalty= get_hyphens (s);
std_hyphenate (s, after, left, right, penalty[after]);
}
/******************************************************************************
* Oriental languages
******************************************************************************/
struct oriental_language_rep: language_rep {
oriental_language_rep (string lan_name);
text_property advance (string s, int& pos);
array<int> get_hyphens (string s);
void hyphenate (string s, int after, string& left, string& right);
};
oriental_language_rep::oriental_language_rep (string lan_name):
language_rep (lan_name) {}
text_property
oriental_language_rep::advance (string s, int& pos) {
if (pos == N(s)) return &tp_normal_rep;
if (s[pos]==' ') {
pos++;
if ((pos == N(s)) || (!is_punctuation (s[pos])))
return &tp_space_rep;
return &tp_blank_rep;
}
int begin= pos;
while (pos<N(s) && s[pos] != ' ') {
int start= pos;
tm_char_forwards (s, pos);
string c= s (start, pos);
if (starts (c, "<#300") && N(c) == 7) {
if (start > begin) pos= start;
break;
}
}
return &tp_normal_rep;
}
array<int>
oriental_language_rep::get_hyphens (string s) {
int i, n= N(s);
array<int> T (n-1);
for (i=0; i<n-1; i++)
T[i]= HYPH_INVALID;
for (i=0, tm_char_forwards (s, i); i<n; tm_char_forwards (s, i))
if (s[i] == '<')
T[i-1]= 0;
return T;
}
void
oriental_language_rep::hyphenate (
string s, int after, string& left, string& right)
{
left = s (0, after+1);
right= s (after+1, N(s));
}
/******************************************************************************
* Miscellaneous language related routines
******************************************************************************/
string
locale_to_language (string s) {
if (N(s) > 5) s= s (0, 5);
if (s == "en_GB") return "british";
if (s == "zh_TW") return "taiwanese";
if (N(s) > 2) s= s (0, 2);
if (s == "bg") return "bulgarian";
if (s == "zh") return "chinese";
if (s == "cs") return "czech";
if (s == "da") return "danish";
if (s == "nl") return "dutch";
if (s == "en") return "english";
if (s == "fi") return "finnish";
if (s == "fr") return "french";
if (s == "de") return "german";
if (s == "hu") return "hungarian";
if (s == "it") return "italian";
if (s == "ja") return "japanese";
if (s == "ko") return "korean";
if (s == "pl") return "polish";
if (s == "pt") return "portuguese";
if (s == "ro") return "romanian";
if (s == "ru") return "russian";
if (s == "sl") return "slovene";
if (s == "es") return "spanish";
if (s == "sv") return "swedish";
if (s == "uk") return "ukrainian";
return "english";
}
string
language_to_locale (string s) {
if (s == "american") return "en_US";
if (s == "british") return "en_GB";
if (s == "bulgarian") return "bg_BG";
if (s == "chinese") return "zh_CN";
if (s == "czech") return "cs_CZ";
if (s == "danish") return "da_DK";
if (s == "dutch") return "nl_NL";
if (s == "english") return "en_US";
if (s == "finnish") return "fi_FI";
if (s == "french") return "fr_FR";
if (s == "german") return "de_DE";
if (s == "hungarian") return "hu_HU";
if (s == "italian") return "it_IT";
if (s == "japanese") return "ja_JP";
if (s == "korean") return "ko_KR";
if (s == "polish") return "pl_PL";
if (s == "portuguese") return "pt_PT";
if (s == "romanian") return "ro_RO";
if (s == "russian") return "ru_RU";
if (s == "slovene") return "sl_SI";
if (s == "spanish") return "es_ES";
if (s == "swedish") return "sv_SV";
if (s == "taiwanese") return "zh_TW";
if (s == "ukrainian") return "uk_UA";
return "en_US";
}
string
get_locale_language () {
string env_lan= get_env ("LC_ALL");
if (env_lan != "") return locale_to_language (env_lan);
env_lan= get_env ("LC_MESSAGES");
if (env_lan != "") return locale_to_language (env_lan);
env_lan= get_env ("LANG");
if (env_lan != "") return locale_to_language (env_lan);
env_lan= get_env ("GDM_LANG");
if (env_lan != "") return locale_to_language (env_lan);
return "english";
}
static string
simplify_date (string s) {
int i, n=N(s);
string r;
for (i=0; i<n; i++)
if ((s[i]!='0') || ((N(r)>0) && is_digit(r[N(r)-1]))) r << s[i];
return r;
}
string
get_date (string lan, string fm) {
#ifdef OS_WIN32
return "not implemented";
#else
if (fm == "") {
if ((lan == "british") || (lan == "english") || (lan == "american"))
fm= "%B %d, %Y";
else if (lan == "german")
fm= "%d. %B %Y";
else if (lan == "chinese" || lan == "japanese" ||
lan == "korean" || lan == "taiwanese")
{
string y= simplify_date (var_eval_system ("date +\"%Y\""));
string m= simplify_date (var_eval_system ("date +\"%m\""));
string d= simplify_date (var_eval_system ("date +\"%d\""));
if (lan == "japanese")
return y * "<#5e74>" * m * "<#6708>" * d * "<#65e5>";
if (lan == "korean")
return y * "<#b144> " * m * "<#c6d4> " * d * "<#c77c>";
return y * "," * m * "," * d;
}
else fm= "%d %B %Y";
}
lan= language_to_locale (lan);
string old= get_env ("LANG");
set_env ("LANG", lan);
string date= simplify_date (var_eval_system ("date +\"" * fm * "\""));
if ((lan == "cz_CZ") || (lan == "hu_HU") || (lan == "pl_PL"))
date= il2_to_cork (date);
// if (lan == "ru_RU") date= iso_to_koi8 (date);
set_env ("LANG", old);
return date;
#endif
}
/******************************************************************************
* Main interface
******************************************************************************/
language
text_language (string s) {
if (language::instances -> contains (s)) return language (s);
if (s == "american") return new text_language_rep (s, "us");
if (s == "british") return new text_language_rep (s, "ukenglish");
if (s == "bulgarian") return new text_language_rep (s, "bulgarian");
if (s == "chinese") return new oriental_language_rep (s);
if (s == "czech") return new text_language_rep (s, "czech");
if (s == "danish") return new text_language_rep (s, "danish");
if (s == "dutch") return new text_language_rep (s, "dutch");
if (s == "english") return new text_language_rep (s, "us");
if (s == "finnish") return new text_language_rep (s, "finnish");
if (s == "french") return new text_language_rep (s, "french");
if (s == "german") return new text_language_rep (s, "german");
if (s == "hungarian") return new text_language_rep (s, "hungarian");
if (s == "italian") return new text_language_rep (s, "italian");
if (s == "japanese") return new oriental_language_rep (s);
if (s == "korean") return new oriental_language_rep (s);
if (s == "polish") return new text_language_rep (s, "polish");
if (s == "portuguese") return new text_language_rep (s, "portuguese");
if (s == "romanian") return new text_language_rep (s, "romanian");
if (s == "russian") return new text_language_rep (s, "russian");
if (s == "slovene") return new text_language_rep (s, "slovene");
if (s == "spanish") return new text_language_rep (s, "spanish");
if (s == "swedish") return new text_language_rep (s, "swedish");
if (s == "taiwanese") return new oriental_language_rep (s);
if (s == "ukrainian") return new text_language_rep (s, "ukrainian");
if (s == "verbatim") return new verb_language_rep ();
cerr << "\nThe language was " << s << "\n";
fatal_error ("unknown language", "text_language");
return new verb_language_rep ();
// avoids error message when C++ compiler behaves badly
}
- Re: [TeXmacs] Re: frenchspacing?, Zoltán Kovács, 11/06/2007
- Re: [TeXmacs] Re: frenchspacing?, address@hidden, 11/07/2007
- Re: [TeXmacs] Re: frenchspacing?, Zoltán Kovács, 11/07/2007
- Re: [TeXmacs] Re: frenchspacing?, address@hidden, 11/07/2007
Archive powered by MHonArc 2.6.19.