Skip to content

Commit de68a7d

Browse files
dadoonet authored and shahariaazam committed
Remove support for Elasticsearch v5
Closes #799.
1 parent c12dddf commit de68a7d

File tree

36 files changed

+7
-2329
lines changed

36 files changed

+7
-2329
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ You need to install a version matching your Elasticsearch version:
1414

1515
| Elasticsearch | FS Crawler | Released | Docs |
1616
|--------------------|-------------|----------|------------------------------------------------------------------------------|
17-
| 2.x, 5.x, 6.x, 7.x | 2.7-SNAPSHOT| |[2.7-SNAPSHOT](https://fscrawler.readthedocs.io/en/latest/) |
17+
| 6.x, 7.x | 2.7-SNAPSHOT| |[2.7-SNAPSHOT](https://fscrawler.readthedocs.io/en/latest/) |
1818
| 2.x, 5.x, 6.x | 2.6 |2019-01-09|[2.6](https://fscrawler.readthedocs.io/en/fscrawler-2.6) |
1919
| 2.x, 5.x, 6.x | 2.5 |2018-08-04|[2.5](https://fscrawler.readthedocs.io/en/fscrawler-2.5) |
2020
| 2.x, 5.x, 6.x | **2.4** |2017-08-11|[2.4](https://github.com/dadoonet/fscrawler/blob/fscrawler-2.4/README.md) |

cli/src/main/java/fr/pilato/elasticsearch/crawler/fs/cli/FsCrawlerCli.java

Lines changed: 1 addition & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -251,13 +251,7 @@ public static void main(String[] args) throws Exception {
251251
try {
252252
// Let see if we want to upgrade an existing cluster to latest version
253253
if (commands.upgrade) {
254-
logger.info("Upgrading job [{}]", jobName);
255-
boolean success = fsCrawler.upgrade();
256-
if (success) {
257-
// We can rewrite the fscrawler setting file (we now have a elasticsearch.index_folder property)
258-
logger.info("Updating fscrawler setting file");
259-
fsSettingsFileHandler.write(fsSettings);
260-
}
254+
logger.info("Upgrading job [{}]. No rule implemented. Skipping.", jobName);
261255
} else {
262256
try {
263257
fsCrawler.getEsClient().start();

core/src/main/java/fr/pilato/elasticsearch/crawler/fs/FsCrawlerImpl.java

Lines changed: 0 additions & 62 deletions
Original file line numberDiff line numberDiff line change
@@ -19,8 +19,6 @@
1919

2020
package fr.pilato.elasticsearch.crawler.fs;
2121

22-
import fr.pilato.elasticsearch.crawler.fs.client.ESSearchRequest;
23-
import fr.pilato.elasticsearch.crawler.fs.client.ESSearchResponse;
2422
import fr.pilato.elasticsearch.crawler.fs.client.ElasticsearchClient;
2523
import fr.pilato.elasticsearch.crawler.fs.client.ElasticsearchClientUtil;
2624
import fr.pilato.elasticsearch.crawler.fs.framework.FsCrawlerUtil;
@@ -86,66 +84,6 @@ public ElasticsearchClient getEsClient() {
8684
return esClient;
8785
}
8886

89-
/**
90-
* Upgrade FSCrawler indices
91-
* @return true if done successfully
92-
* @throws Exception In case of error
93-
*/
94-
@SuppressWarnings("deprecation")
95-
public boolean upgrade() throws Exception {
96-
// We need to start a client so we can send requests to elasticsearch
97-
try {
98-
esClient.start();
99-
} catch (Exception t) {
100-
logger.fatal("We can not start Elasticsearch Client. Exiting.", t);
101-
return false;
102-
}
103-
104-
// The upgrade script is for now a bit dumb. It assumes that you had an old version of FSCrawler (< 2.3) and it will
105-
// simply move data from index/folder to index_folder
106-
String index = settings.getElasticsearch().getIndex();
107-
108-
// Check that the old index actually exists
109-
if (esClient.isExistingIndex(index)) {
110-
// We check that the new indices don't exist yet or are empty
111-
String indexFolder = settings.getElasticsearch().getIndexFolder();
112-
boolean indexExists = esClient.isExistingIndex(indexFolder);
113-
long numberOfDocs = 0;
114-
if (indexExists) {
115-
ESSearchResponse responseFolder = esClient.search(new ESSearchRequest().withIndex(indexFolder));
116-
numberOfDocs = responseFolder.getTotalHits();
117-
}
118-
if (numberOfDocs > 0) {
119-
logger.warn("[{}] already exists and is not empty. No upgrade needed.", indexFolder);
120-
} else {
121-
logger.debug("[{}] can be upgraded.", index);
122-
123-
// Create the new indices with the right mappings (well, we don't read existing user configuration)
124-
if (!indexExists) {
125-
esClient.createIndices();
126-
logger.info("[{}] has been created.", indexFolder);
127-
}
128-
129-
// Run reindex task for folders
130-
logger.info("Starting reindex folders...");
131-
int folders = esClient.reindex(index, INDEX_TYPE_FOLDER, indexFolder);
132-
logger.info("Done reindexing [{}] folders...", folders);
133-
134-
// Run delete by query task for folders
135-
logger.info("Starting removing folders from [{}]...", index);
136-
esClient.deleteByQuery(index, INDEX_TYPE_FOLDER);
137-
logger.info("Done removing folders from [{}]", index);
138-
139-
logger.info("You can now upgrade your elasticsearch cluster to >=6.0.0!");
140-
return true;
141-
}
142-
} else {
143-
logger.info("[{}] does not exist. No upgrade needed.", index);
144-
}
145-
146-
return false;
147-
}
148-
14987
public void start() throws Exception {
15088
logger.info("Starting FS crawler");
15189
if (loop < 0) {

distribution/es5/pom.xml

Lines changed: 0 additions & 48 deletions
This file was deleted.

distribution/es5/src/main/java/fr/pilato/elasticsearch/crawler/fs/cli/FsCrawler.java

Lines changed: 0 additions & 27 deletions
This file was deleted.

distribution/pom.xml

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,6 @@
1616
<modules>
1717
<module>es7</module>
1818
<module>es6</module>
19-
<module>es5</module>
2019
</modules>
2120

2221
<dependencies>

docs/source/conf.py

Lines changed: 0 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -50,12 +50,10 @@ def read_version(full_version=True):
5050
# The full version, including alpha/beta/rc tags.
5151
release = read_version()
5252

53-
downloadUrlV5 = "https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es5/%s/fscrawler-es5-%s.zip" % (version, version)
5453
downloadUrlV6 = "https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es6/%s/fscrawler-es6-%s.zip" % (version, version)
5554
downloadUrlV7 = "https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es7/%s/fscrawler-es7-%s.zip" % (version, version)
5655

5756
if release.endswith('-SNAPSHOT'):
58-
downloadUrlV5 = "https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es5/%s/" % release
5957
downloadUrlV6 = "https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es6/%s/" % release
6058
downloadUrlV7 = "https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es7/%s/" % release
6159

@@ -231,50 +229,40 @@ def read_version(full_version=True):
231229
.. |ES| replace:: Elasticsearch
232230
.. |Tika_format| replace:: Tika
233231
.. |Tika_version| replace:: Tika {fmt_tika_version}
234-
.. |ESHL_version5| replace:: Elasticsearch Rest Client {fmt_es_version5}
235232
.. |ESHL_version6| replace:: Elasticsearch Rest Client {fmt_es_version6}
236233
.. |ESHL_version7| replace:: Elasticsearch Rest Client {fmt_es_version7}
237234
.. |Levigo_version| replace:: levigo-jbig2-imageio:{fmt_levigo_version}
238235
.. |Tiff_version| replace:: jai-imageio-core:{fmt_tiff_version}
239236
.. |JPEG2000_version| replace:: jai-imageio-jpeg2000:{fmt_jpeg_version}
240-
.. |Download_URL_V5| replace:: fscrawler-es5-{fmt_release}
241237
.. |Download_URL_V6| replace:: fscrawler-es6-{fmt_release}
242238
.. |Download_URL_V7| replace:: fscrawler-es7-{fmt_release}
243-
.. |Maven_Central_V5| replace:: fscrawler-es5-*
244239
.. |Maven_Central_V6| replace:: fscrawler-es6-*
245240
.. |Maven_Central_V7| replace:: fscrawler-es7-*
246-
.. |Sonatype_V5| replace:: fscrawler-es5-*
247241
.. |Sonatype_V6| replace:: fscrawler-es6-*
248242
.. |Sonatype_V7| replace:: fscrawler-es7-*
249243
250244
.. _Tika: http://tika.apache.org/{fmt_tika_version}/
251245
.. _ES: https://www.elastic.co/products/elasticsearch
252246
.. _Tika_format: http://tika.apache.org/{fmt_tika_version}/formats.html#Supported_Document_Formats
253247
.. _Tika_version: http://tika.apache.org/{fmt_tika_version}/
254-
.. _ESHL_version5: https://www.elastic.co/guide/en/elasticsearch/client/java-rest/current/index.html
255248
.. _ESHL_version6: https://www.elastic.co/guide/en/elasticsearch/client/java-rest/current/index.html
256249
.. _ESHL_version7: https://www.elastic.co/guide/en/elasticsearch/client/java-rest/current/index.html
257250
.. _Levigo_version: http://repo1.maven.org/maven2/com/levigo/jbig2/levigo-jbig2-imageio/{fmt_levigo_version}/
258251
.. _Tiff_version: http://repo1.maven.org/maven2/com/github/jai-imageio/jai-imageio-core/{fmt_tiff_version}/
259252
.. _JPEG2000_version: http://repo1.maven.org/maven2/com/github/jai-imageio/jai-imageio-jpeg2000/{fmt_jpeg_version}/
260-
.. _Download_URL_V5: {fmt_downloadUrl_V5}
261253
.. _Download_URL_V6: {fmt_downloadUrl_V6}
262254
.. _Download_URL_V7: {fmt_downloadUrl_V7}
263-
.. _Maven_Central_V5: https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es5/
264255
.. _Maven_Central_V6: https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es6/
265256
.. _Maven_Central_V7: https://repo1.maven.org/maven2/fr/pilato/elasticsearch/crawler/fscrawler-es7/
266-
.. _Sonatype_V5: https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es5/
267257
.. _Sonatype_V6: https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es6/
268258
.. _Sonatype_V7: https://oss.sonatype.org/content/repositories/snapshots/fr/pilato/elasticsearch/crawler/fscrawler-es7/
269259
""".format(
270260
fmt_tika_version=config.get('3rdParty', 'TikaVersion'),
271-
fmt_es_version5=config.get('3rdParty', 'ElasticsearchVersion5'),
272261
fmt_es_version6=config.get('3rdParty', 'ElasticsearchVersion6'),
273262
fmt_es_version7=config.get('3rdParty', 'ElasticsearchVersion7'),
274263
fmt_levigo_version=config.get('3rdParty', 'LevigoVersion'),
275264
fmt_tiff_version=config.get('3rdParty', 'TiffVersion'),
276265
fmt_jpeg_version=config.get('3rdParty', 'JpegVersion'),
277-
fmt_downloadUrl_V5=downloadUrlV5,
278266
fmt_downloadUrl_V6=downloadUrlV6,
279267
fmt_downloadUrl_V7=downloadUrlV7,
280268
fmt_release=release

docs/source/dev/build.rst

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,6 @@ But you need first to specify the Maven profile to use and rebuild the project.
5050

5151
* ``es-7x`` for Elasticsearch 7.x
5252
* ``es-6x`` for Elasticsearch 6.x
53-
* ``es-5x`` for Elasticsearch 5.x
5453

5554

5655
Run tests with an external cluster
@@ -62,9 +61,8 @@ To run the test suite against an elasticsearch instance running locally, just ru
6261

6362
.. tip::
6463

65-
If you want to run against a version 5 or 6, run::
64+
If you want to run against a version 6, run::
6665

67-
mvn verify -pl fr.pilato.elasticsearch.crawler:fscrawler-it-v5 -Dtests.cluster.url=http://localhost:9200
6866
mvn verify -pl fr.pilato.elasticsearch.crawler:fscrawler-it-v6 -Dtests.cluster.url=http://localhost:9200
6967

7068
.. hint::

docs/source/fscrawler.ini

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,6 @@ Version=2.7-SNAPSHOT
33

44
[3rdParty]
55
TikaVersion=1.22
6-
ElasticsearchVersion5=5.6.15
76
ElasticsearchVersion6=6.8.5
87
ElasticsearchVersion7=7.4.2
98
LevigoVersion=2.0

docs/source/index.rst

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,6 @@ This crawler helps to index binary documents such as PDF, Open Office, MS Office
2424

2525
* |ESHL_version7|_ for Elasticsearch V7.
2626
* |ESHL_version6|_ for Elasticsearch V6.
27-
* |ESHL_version5|_ for Elasticsearch V5.
2827

2928
.. toctree::
3029
:caption: Installation Guide

0 commit comments

Comments
 (0)