Add SeedDMS support for office document indexing
This commit is contained in:
		
							parent
							
								
									224546c12f
								
							
						
					
					
						commit
						579f4e92e6
					
				| @ -3,7 +3,7 @@ | |||||||
| SOURCE_DIR=$(realpath $(dirname "${0}")) | SOURCE_DIR=$(realpath $(dirname "${0}")) | ||||||
| 
 | 
 | ||||||
| # Install dependencies for SeedDMS | # Install dependencies for SeedDMS | ||||||
| apt-get -y --no-install-recommends install catdoc ghostscript gnumeric id3 imagemagick php7.0-gd php7.0-fpm php7.0-mbstring php7.0-pgsql php7.0-xml php-log php-mail php-pear poppler-utils | apt-get -y --no-install-recommends install ghostscript id3 imagemagick libreoffice-calc libreoffice-writer php7.0-gd php7.0-fpm php7.0-mbstring php7.0-pgsql php7.0-xml php-log php-mail php-pear poppler-utils unoconv | ||||||
| 
 | 
 | ||||||
| # Install SeedDMS | # Install SeedDMS | ||||||
| wget https://sourceforge.net/projects/seeddms/files/seeddms-5.1.3/seeddms-quickstart-5.1.3.tar.gz/download -O /srv/seeddms.tgz | wget https://sourceforge.net/projects/seeddms/files/seeddms-5.1.3/seeddms-quickstart-5.1.3.tar.gz/download -O /srv/seeddms.tgz | ||||||
|  | |||||||
| @ -11,3 +11,5 @@ pm.max_children = 8 | |||||||
| 
 | 
 | ||||||
| php_admin_value[open_basedir] = /srv/seeddms:/tmp:/tmp:/usr/share/php | php_admin_value[open_basedir] = /srv/seeddms:/tmp:/tmp:/usr/share/php | ||||||
| php_admin_value[upload_max_filesize] = 100M | php_admin_value[upload_max_filesize] = 100M | ||||||
|  | 
 | ||||||
|  | env[LANG]=en_US.UTF-8 | ||||||
|  | |||||||
| @ -24,10 +24,16 @@ | |||||||
|         <server coreDir="" luceneClassDir="" contentOffsetDir="1048576" maxDirID="0" updateNotifyTime="86400" extraPath="/srv/seeddms/pear" cmdTimeout="5" maxExecutionTime="30"/> |         <server coreDir="" luceneClassDir="" contentOffsetDir="1048576" maxDirID="0" updateNotifyTime="86400" extraPath="/srv/seeddms/pear" cmdTimeout="5" maxExecutionTime="30"/> | ||||||
|         <converters target="fulltext"> |         <converters target="fulltext"> | ||||||
|             <converter mimeType="application/pdf">pdftotext -enc UTF-8 -nopgbrk %s - | sed -e 's/ [a-zA-Z0-9.]\{1\} / /g' -e 's/[0-9.]//g'</converter> |             <converter mimeType="application/pdf">pdftotext -enc UTF-8 -nopgbrk %s - | sed -e 's/ [a-zA-Z0-9.]\{1\} / /g' -e 's/[0-9.]//g'</converter> | ||||||
|             <converter mimeType="application/msword">catdoc %s</converter> |             <converter mimeType="text/rtf">unoconv -d document -f txt --stdout %s</converter> | ||||||
|             <converter mimeType="application/vnd.ms-excel">ssconvert -T Gnumeric_stf:stf_csv -S %s fd://1</converter> |             <converter mimeType="application/msword">unoconv -d document -f txt --stdout %s</converter> | ||||||
|  |             <converter mimeType="application/vnd.oasis.opendocument.text">unoconv -d document -f txt --stdout %s</converter> | ||||||
|  |             <converter mimeType="application/vnd.openxmlformats-officedocument.wordprocessingml.document">unoconv -d document -f txt --stdout %s</converter> | ||||||
|  |             <converter mimeType="application/vnd.ms-excel">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||||
|  |             <converter mimeType="application/vnd.oasis.opendocument.spreadsheet">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||||
|  |             <converter mimeType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet">unoconv -d spreadsheet -f csv --stdout %s</converter> | ||||||
|             <converter mimeType="audio/mp3">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> |             <converter mimeType="audio/mp3">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> | ||||||
|             <converter mimeType="audio/mpeg">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> |             <converter mimeType="audio/mpeg">id3 -l -R %s | egrep '(Title|Artist|Album)' | sed 's/^[^:]*: //g'</converter> | ||||||
|  |             <converter mimeType="text/html">unoconv -d document -f txt --stdout %s</converter> | ||||||
|             <converter mimeType="text/plain">cat %s</converter> |             <converter mimeType="text/plain">cat %s</converter> | ||||||
|         </converters> |         </converters> | ||||||
|     </advanced> |     </advanced> | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user