Add SeedDMS support for office document indexing
This commit is contained in:
		
							parent
							
								
									224546c12f
								
							
						
					
					
						commit
						579f4e92e6
					
				| @ -3,7 +3,7 @@ | ||||
| SOURCE_DIR=$(realpath $(dirname "${0}")) | ||||
| 
 | ||||
| # Install dependencies for SeedDMS | ||||
| apt-get -y --no-install-recommends install catdoc ghostscript gnumeric id3 imagemagick php7.0-gd php7.0-fpm php7.0-mbstring php7.0-pgsql php7.0-xml php-log php-mail php-pear poppler-utils | ||||
| apt-get -y --no-install-recommends install ghostscript id3 imagemagick libreoffice-calc libreoffice-writer php7.0-gd php7.0-fpm php7.0-mbstring php7.0-pgsql php7.0-xml php-log php-mail php-pear poppler-utils unoconv | ||||
| 
 | ||||
| # Install SeedDMS | ||||
| wget https://sourceforge.net/projects/seeddms/files/seeddms-5.1.3/seeddms-quickstart-5.1.3.tar.gz/download -O /srv/seeddms.tgz | ||||
|  | ||||
| @ -11,3 +11,5 @@ pm.max_children = 8 | ||||
| 
 | ||||
| php_admin_value[open_basedir] = /srv/seeddms:/tmp:/tmp:/usr/share/php | ||||
| php_admin_value[upload_max_filesize] = 100M | ||||
| 
 | ||||
| env[LANG]=en_US.UTF-8 | ||||
|  | ||||
| @ -24,10 +24,16 @@ | ||||
|         <server coreDir="" luceneClassDir="" contentOffsetDir="1048576" maxDirID="0" updateNotifyTime="86400" extraPath="/srv/seeddms/pear" cmdTimeout="5" maxExecutionTime="30"/> | ||||
|         <converters target="fulltext"> | ||||
|             <converter mimeType="application/pdf">pdftotext -enc UTF-8 -nopgbrk %s - | sed -e 's/ [a-zA-Z0-9.]\{1\} / /g' -e 's/[0-9.]//g'</converter> | ||||
|             <converter mimeType="application/msword">catdoc %s</converter> | ||||
|             <converter mimeType="application/vnd.ms-excel">ssconvert -T Gnumeric_stf:stf_csv -S %s fd://1</converter> | ||||
|             <converter mimeType="text/rtf">unoconv -d document -f txt --stdout %s</converter> | ||||
|             <converter mimeType="application/msword">unoconv -d document -f txt --stdout %s</converter> | ||||
|             <converter mimeType="application/vnd.oasis.opendocument.text">unoconv -d document -f txt --stdout %s</converter> | ||||
|             <converter mimeType="application/vnd.openxmlformats-officedocument.wordprocessingml.document">unoconv -d document -f txt --stdout %s</converter> | ||||
|             <converter mimeType="application/vnd.ms-excel">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||
|             <converter mimeType="application/vnd.oasis.opendocument.spreadsheet">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||
|             <converter mimeType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||
|             <converter mimeType="audio/mp3">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> | ||||
|             <converter mimeType="audio/mpeg">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> | ||||
|             <converter mimeType="text/html">unoconv -d document -f txt --stdout %s</converter> | ||||
|             <converter mimeType="text/plain">cat %s</converter> | ||||
|         </converters> | ||||
|     </advanced> | ||||
|  | ||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user