To support Unicode characters with Solr and Tomcat, you need an additional setting: add the URIEncoding="UTF-8" attribute to the Tomcat Connector, as shown below.
<Server ...>
  <Service ...>
    <!-- URIEncoding="UTF-8" is the additional setting needed for Unicode
         characters. The Connector is written as an open tag (not self-closed)
         so that it pairs with the closing </Connector> tag below. -->
    <Connector ... URIEncoding="UTF-8">
      ...
    </Connector>
  </Service>
</Server>
<Server ...>
  <Service ...>
    <!-- URIEncoding="UTF-8" is the additional setting needed for Unicode
         characters. The Connector is written as an open tag (not self-closed)
         so that it pairs with the closing </Connector> tag below. -->
    <Connector ... URIEncoding="UTF-8">
      ...
    </Connector>
  </Service>
</Server>
http://host:port/solr/core/update?stream.body=<delete><query>*:*</query></delete>&commit=true
<delete><query>*:*</query></delete>
// Clears the index at masterIndexUrl: deletes every document matching "*:*",
// then commits and optimizes. On failure a rollback is attempted (best-effort).
SolrServer server = null;
try {
    server = new CommonsHttpSolrServer(masterIndexUrl);
    server.deleteByQuery("*:*");
    server.commit(true, true);
    server.optimize(true, true);
} catch (Exception e) {
    // Report the failure instead of silently swallowing it.
    System.err.println("Failed to clear Solr index at " + masterIndexUrl + ": " + e);
    // server is still null if the constructor itself threw; there is nothing
    // to roll back in that case, and calling rollback() would raise an NPE.
    if (server != null) {
        try {
            server.rollback();
        } catch (Exception rollbackFailure) {
            // Rollback stays best-effort: log and continue rather than rethrow.
            System.err.println("Rollback after failed index clear also failed: " + rollbackFailure);
        }
    }
}
<!-- title: "text" type, indexed and stored. -->
<field name="title"
       type="text"
       indexed="true"
       stored="true"/>
<!-- title_sort: "string" type copy of title, indexed but not stored
     (presumably used for sorting, going by the field name). -->
<field name="title_sort"
       type="string"
       indexed="true"
       stored="false"/>
<!-- Populate the string-typed field from title. -->
<copyField source="title"
           dest="title_sort"/>
<!-- Field definitions -->
<field name="subject"
       type="text"
       indexed="true"
       stored="true"/>
<field name="subject_text"
       type="text"
       indexed="true"
       stored="true"/>
<field name="text"
       type="text"
       indexed="true"
       stored="true"/>
<!-- Copies the subject field into the subject_text field. -->
<copyField source="subject"
           dest="subject_text"/>
<!-- This copy does NOT chain: subject_text, being the destination of the
     copyField above, cannot feed into text, so you end up with no subject
     content being copied into text. -->
<copyField source="subject_text"
           dest="text"/>
The copy is done at the stream source level, so the result of one copyField never feeds into another copyField.