2009-05-12 02:45:00 +09:00
< ? php
/*
2009-08-26 07:14:12 +09:00
* StatusNet - the distributed open - source microblogging tool
2009-08-26 07:12:20 +09:00
* Copyright ( C ) 2008 , 2009 , StatusNet , Inc .
2009-05-12 02:45:00 +09:00
*
* This program is free software : you can redistribute it and / or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation , either version 3 of the License , or
* ( at your option ) any later version .
*
* This program is distributed in the hope that it will be useful ,
* but WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
* GNU Affero General Public License for more details .
*
* You should have received a copy of the GNU Affero General Public License
* along with this program . If not , see < http :// www . gnu . org / licenses />.
*/
2013-11-10 22:33:45 +09:00
if ( ! defined ( 'GNUSOCIAL' )) { exit ( 1 ); }
2009-05-12 02:45:00 +09:00
/**
* Table Definition for file
*/
2011-08-23 06:52:02 +09:00
class File extends Managed_DataObject
2009-05-12 02:45:00 +09:00
{
public $__table = 'file' ; // table name
2009-06-23 06:19:41 +09:00
public $id ; // int(4) primary_key not_null
2015-02-18 02:55:12 +09:00
public $urlhash ; // varchar(64) unique_key
public $url ; // text
2015-02-25 05:11:25 +09:00
public $filehash ; // varchar(64) indexed
2009-06-23 07:48:31 +09:00
public $mimetype ; // varchar(50)
public $size ; // int(4)
2015-02-13 02:18:55 +09:00
public $title ; // varchar(191) not 255 because utf8mb4 takes more space
2009-06-23 07:48:31 +09:00
public $date ; // int(4)
public $protected ; // int(4)
2015-02-13 02:18:55 +09:00
public $filename ; // varchar(191) not 255 because utf8mb4 takes more space
2014-05-07 16:51:37 +09:00
public $width ; // int(4)
public $height ; // int(4)
2009-06-23 06:19:41 +09:00
public $modified ; // timestamp() not_null default_CURRENT_TIMESTAMP
2009-05-12 02:45:00 +09:00
2015-02-18 02:55:12 +09:00
const URLHASH_ALG = 'sha256' ;
2015-02-25 05:11:25 +09:00
const FILEHASH_ALG = 'sha256' ;
2015-02-18 02:55:12 +09:00
2011-08-23 06:52:02 +09:00
public static function schemaDef ()
{
return array (
'fields' => array (
'id' => array ( 'type' => 'serial' , 'not null' => true ),
2015-02-20 05:21:39 +09:00
'urlhash' => array ( 'type' => 'varchar' , 'length' => 64 , 'not null' => true , 'description' => 'sha256 of destination URL (url field)' ),
2015-02-20 06:06:43 +09:00
'url' => array ( 'type' => 'text' , 'description' => 'destination URL after following possible redirections' ),
2015-02-25 05:11:25 +09:00
'filehash' => array ( 'type' => 'varchar' , 'length' => 64 , 'not null' => false , 'description' => 'sha256 of the file contents, only for locally stored files of course' ),
2011-08-23 06:52:02 +09:00
'mimetype' => array ( 'type' => 'varchar' , 'length' => 50 , 'description' => 'mime type of resource' ),
'size' => array ( 'type' => 'int' , 'description' => 'size of resource when available' ),
2015-02-13 02:18:55 +09:00
'title' => array ( 'type' => 'varchar' , 'length' => 191 , 'description' => 'title of resource when available' ),
2011-08-23 06:52:02 +09:00
'date' => array ( 'type' => 'int' , 'description' => 'date of resource according to http query' ),
'protected' => array ( 'type' => 'int' , 'description' => 'true when URL is private (needs login)' ),
2015-02-13 02:18:55 +09:00
'filename' => array ( 'type' => 'varchar' , 'length' => 191 , 'description' => 'if a local file, name of the file' ),
2014-04-22 03:39:28 +09:00
'width' => array ( 'type' => 'int' , 'description' => 'width in pixels, if it can be described as such and data is available' ),
'height' => array ( 'type' => 'int' , 'description' => 'height in pixels, if it can be described as such and data is available' ),
2011-08-23 06:52:02 +09:00
'modified' => array ( 'type' => 'timestamp' , 'not null' => true , 'description' => 'date this record was modified' ),
),
'primary key' => array ( 'id' ),
'unique keys' => array (
2015-02-18 02:55:12 +09:00
'file_urlhash_key' => array ( 'urlhash' ),
2011-08-23 06:52:02 +09:00
),
2015-02-25 05:11:25 +09:00
'indexes' => array (
'file_filehash_idx' => array ( 'filehash' ),
),
2011-08-23 06:52:02 +09:00
);
}
2009-05-14 03:27:32 +09:00
function isProtected ( $url ) {
return 'http://www.facebook.com/login.php' === $url ;
}
2010-03-11 06:39:42 +09:00
/**
* Save a new file record .
*
* @ param array $redir_data lookup data eg from File_redirection :: where ()
* @ param string $given_url
* @ return File
*/
2015-09-27 19:29:38 +09:00
public static function saveNew ( array $redir_data , $given_url )
{
$file = null ;
try {
// I don't know why we have to keep doing this but we run a last check to avoid
// uniqueness bugs.
$file = File :: getByUrl ( $given_url );
2015-10-02 05:14:49 +09:00
return $file ;
2015-09-27 19:29:38 +09:00
} catch ( NoResultException $e ) {
2015-10-02 05:14:49 +09:00
// We don't have the file's URL since before, so let's continue.
}
$file = new File ;
$file -> url = $given_url ;
if ( ! empty ( $redir_data [ 'protected' ])) $file -> protected = $redir_data [ 'protected' ];
if ( ! empty ( $redir_data [ 'title' ])) $file -> title = $redir_data [ 'title' ];
if ( ! empty ( $redir_data [ 'type' ])) $file -> mimetype = $redir_data [ 'type' ];
if ( ! empty ( $redir_data [ 'size' ])) $file -> size = intval ( $redir_data [ 'size' ]);
if ( isset ( $redir_data [ 'time' ]) && $redir_data [ 'time' ] > 0 ) $file -> date = intval ( $redir_data [ 'time' ]);
2015-11-02 14:15:08 +09:00
$file -> saveFile ();
return $file ;
}
public function saveFile () {
$this -> urlhash = self :: hashurl ( $this -> url );
2015-10-02 05:14:49 +09:00
2015-11-02 14:15:08 +09:00
if ( ! Event :: handle ( 'StartFileSaveNew' , array ( & $this ))) {
throw new ServerException ( 'File not saved due to an aborted StartFileSaveNew event.' );
}
$this -> id = $this -> insert ();
if ( $this -> id === false ) {
2015-10-02 05:14:49 +09:00
throw new ServerException ( 'File/URL metadata could not be saved to the database.' );
2011-10-01 02:03:42 +09:00
}
2009-05-14 03:27:32 +09:00
2015-11-02 14:15:08 +09:00
Event :: handle ( 'EndFileSaveNew' , array ( $this ));
2009-05-14 03:27:32 +09:00
}
2010-05-26 05:09:21 +09:00
/**
2010-11-16 04:00:42 +09:00
* Go look at a URL and possibly save data about it if it ' s new :
* - follow redirect chains and store them in file_redirection
* - if a thumbnail is available , save it in file_thumbnail
* - save file record with basic info
* - optionally save a file_to_post record
* - return the File object with the full reference
*
* @ param string $given_url the URL we ' re looking at
2015-06-05 00:36:11 +09:00
* @ param Notice $notice ( optional )
2010-11-16 04:00:42 +09:00
* @ param bool $followRedirects defaults to true
*
* @ return mixed File on success , - 1 on some errors
*
2014-06-02 09:08:48 +09:00
* @ throws ServerException on failure
2010-05-26 05:09:21 +09:00
*/
2015-06-05 00:36:11 +09:00
public static function processNew ( $given_url , Notice $notice = null , $followRedirects = true ) {
2014-06-02 09:08:48 +09:00
if ( empty ( $given_url )) {
throw new ServerException ( 'No given URL to process' );
}
2009-05-14 03:27:32 +09:00
$given_url = File_redirection :: _canonUrl ( $given_url );
2014-06-02 09:08:48 +09:00
if ( empty ( $given_url )) {
throw new ServerException ( 'No canonical URL from given URL to process' );
}
2015-11-02 14:15:08 +09:00
$redir = File_redirection :: where ( $given_url );
$file = $redir -> getFile ();
2014-06-02 09:08:48 +09:00
2015-02-20 03:29:55 +09:00
// If we still don't have a File object, let's create one now!
2015-11-02 14:15:08 +09:00
if ( empty ( $file -> id )) {
if ( $redir -> url === $given_url || ! $followRedirects ) {
2015-02-20 03:29:55 +09:00
// Save the File object based on our lookup trace
2015-11-02 14:15:08 +09:00
$file -> saveFile ();
2015-02-20 03:29:55 +09:00
} else {
2015-11-02 14:15:08 +09:00
$file -> saveFile ();
$redir -> file_id = $file -> id ;
$redir -> insert ();
2009-05-14 03:27:32 +09:00
}
2015-11-02 14:15:08 +09:00
}
2009-05-14 03:27:32 +09:00
2015-11-02 14:15:08 +09:00
if ( ! $file instanceof File || empty ( $file -> id )) {
// This should not happen
throw new ServerException ( 'URL processing failed without new File object' );
2009-05-14 03:27:32 +09:00
}
2009-06-23 07:48:31 +09:00
2015-06-05 00:36:11 +09:00
if ( $notice instanceof Notice ) {
File_to_post :: processNew ( $file , $notice );
2009-08-28 12:23:31 +09:00
}
2015-11-02 14:15:08 +09:00
2014-06-02 09:08:48 +09:00
return $file ;
2009-05-14 03:27:32 +09:00
}
2009-06-01 10:03:55 +09:00
2013-10-06 01:43:41 +09:00
public static function respectsQuota ( Profile $scoped , $fileSize ) {
2009-07-08 04:55:10 +09:00
if ( $fileSize > common_config ( 'attachments' , 'file_quota' )) {
2011-12-28 20:44:42 +09:00
// TRANS: Message used to be inserted as %2$s in the text "No file may
// TRANS: be larger than %1$d byte and the file you sent was %2$s.".
// TRANS: %1$d is the number of bytes of an uploaded file.
$fileSizeText = sprintf ( _m ( '%1$d byte' , '%1$d bytes' , $fileSize ), $fileSize );
$fileQuota = common_config ( 'attachments' , 'file_quota' );
2010-07-29 20:01:04 +09:00
// TRANS: Message given if an upload is larger than the configured maximum.
2011-12-28 20:44:42 +09:00
// TRANS: %1$d (used for plural) is the byte limit for uploads,
// TRANS: %2$s is the proper form of "n bytes". This is the only ways to have
// TRANS: gettext support multiple plurals in the same message, unfortunately...
2013-10-06 01:43:41 +09:00
throw new ClientException (
sprintf ( _m ( 'No file may be larger than %1$d byte and the file you sent was %2$s. Try to upload a smaller version.' ,
2011-12-28 20:44:42 +09:00
'No file may be larger than %1$d bytes and the file you sent was %2$s. Try to upload a smaller version.' ,
$fileQuota ),
2013-10-06 01:43:41 +09:00
$fileQuota , $fileSizeText ));
2009-06-01 10:03:55 +09:00
}
2013-10-06 01:43:41 +09:00
$file = new File ;
$query = " select sum(size) as total from file join file_to_post on file_to_post.file_id = file.id join notice on file_to_post.post_id = notice.id where profile_id = { $scoped -> id } and file.url like '%/notice/%/file' " ;
$file -> query ( $query );
$file -> fetch ();
$total = $file -> total + $fileSize ;
2009-06-01 10:03:55 +09:00
if ( $total > common_config ( 'attachments' , 'user_quota' )) {
2010-07-29 20:01:04 +09:00
// TRANS: Message given if an upload would exceed user quota.
2010-11-05 02:33:39 +09:00
// TRANS: %d (number) is the user quota in bytes and is used for plural.
2013-10-06 01:43:41 +09:00
throw new ClientException (
sprintf ( _m ( 'A file this large would exceed your user quota of %d byte.' ,
2010-11-05 02:33:39 +09:00
'A file this large would exceed your user quota of %d bytes.' ,
common_config ( 'attachments' , 'user_quota' )),
2013-10-06 01:43:41 +09:00
common_config ( 'attachments' , 'user_quota' )));
2009-06-01 10:03:55 +09:00
}
2009-07-22 14:05:44 +09:00
$query .= ' AND EXTRACT(month FROM file.modified) = EXTRACT(month FROM now()) and EXTRACT(year FROM file.modified) = EXTRACT(year FROM now())' ;
2013-10-06 01:43:41 +09:00
$file -> query ( $query );
$file -> fetch ();
$total = $file -> total + $fileSize ;
2009-06-01 10:03:55 +09:00
if ( $total > common_config ( 'attachments' , 'monthly_quota' )) {
2010-07-29 20:01:04 +09:00
// TRANS: Message given id an upload would exceed a user's monthly quota.
2010-11-05 02:33:39 +09:00
// TRANS: $d (number) is the monthly user quota in bytes and is used for plural.
2013-10-06 01:43:41 +09:00
throw new ClientException (
sprintf ( _m ( 'A file this large would exceed your monthly quota of %d byte.' ,
2010-11-05 02:33:39 +09:00
'A file this large would exceed your monthly quota of %d bytes.' ,
common_config ( 'attachments' , 'monthly_quota' )),
2013-10-06 01:43:41 +09:00
common_config ( 'attachments' , 'monthly_quota' )));
2009-06-01 10:03:55 +09:00
}
return true ;
}
2009-06-23 07:48:31 +09:00
2015-05-30 22:41:04 +09:00
public function getFilename ()
{
if ( ! self :: validFilename ( $this -> filename )) {
// TRANS: Client exception thrown if a file upload does not have a valid name.
throw new ClientException ( _ ( " Invalid filename. " ));
}
return $this -> filename ;
}
2009-06-23 07:48:31 +09:00
// where should the file go?
2014-04-17 06:17:27 +09:00
static function filename ( Profile $profile , $origname , $mimetype )
2009-06-23 23:29:43 +09:00
{
2015-02-25 05:11:25 +09:00
$ext = self :: guessMimeExtension ( $mimetype );
2010-11-04 09:05:26 +09:00
2014-04-17 06:17:27 +09:00
// Normalize and make the original filename more URL friendly.
2014-06-23 00:03:27 +09:00
$origname = basename ( $origname , " . $ext " );
2014-04-17 06:17:27 +09:00
if ( class_exists ( 'Normalizer' )) {
// http://php.net/manual/en/class.normalizer.php
// http://www.unicode.org/reports/tr15/
$origname = Normalizer :: normalize ( $origname , Normalizer :: FORM_KC );
}
$origname = preg_replace ( '/[^A-Za-z0-9\.\_]/' , '_' , $origname );
2014-06-23 00:03:27 +09:00
$nickname = $profile -> getNickname ();
2014-04-17 06:17:27 +09:00
$datestamp = strftime ( '%Y%m%d' , time ());
do {
// generate new random strings until we don't run into a filename collision.
$random = strtolower ( common_confirmation_code ( 16 ));
$filename = " $nickname - $datestamp - $origname - $random . $ext " ;
} while ( file_exists ( self :: path ( $filename )));
return $filename ;
2009-06-23 23:29:43 +09:00
}
2009-06-23 07:48:31 +09:00
2015-02-25 05:11:25 +09:00
static function guessMimeExtension ( $mimetype )
{
try {
$ext = common_supported_mime_to_ext ( $mimetype );
} catch ( Exception $e ) {
// We don't support this mimetype, but let's guess the extension
$ext = substr ( strrchr ( $mimetype , '/' ), 1 );
}
return strtolower ( $ext );
}
2010-02-02 01:48:31 +09:00
/**
* Validation for as - saved base filenames
*/
static function validFilename ( $filename )
{
2010-02-03 02:30:15 +09:00
return preg_match ( '/^[A-Za-z0-9._-]+$/' , $filename );
2010-02-02 01:48:31 +09:00
}
/**
* @ throws ClientException on invalid filename
*/
2009-06-23 23:29:43 +09:00
static function path ( $filename )
{
2010-02-02 01:48:31 +09:00
if ( ! self :: validFilename ( $filename )) {
2010-07-29 20:01:04 +09:00
// TRANS: Client exception thrown if a file upload does not have a valid name.
throw new ClientException ( _ ( " Invalid filename. " ));
2010-02-02 01:48:31 +09:00
}
2009-06-23 23:29:43 +09:00
$dir = common_config ( 'attachments' , 'dir' );
2009-06-23 07:48:31 +09:00
2009-06-23 23:29:43 +09:00
if ( $dir [ strlen ( $dir ) - 1 ] != '/' ) {
$dir .= '/' ;
}
2009-06-23 07:48:31 +09:00
2009-06-23 23:29:43 +09:00
return $dir . $filename ;
}
2009-06-23 07:48:31 +09:00
2009-06-23 23:29:43 +09:00
static function url ( $filename )
{
2010-02-02 01:48:31 +09:00
if ( ! self :: validFilename ( $filename )) {
2010-07-29 20:01:04 +09:00
// TRANS: Client exception thrown if a file upload does not have a valid name.
throw new ClientException ( _ ( " Invalid filename. " ));
2010-02-02 01:48:31 +09:00
}
2010-10-15 03:22:17 +09:00
if ( common_config ( 'site' , 'private' )) {
2009-06-23 07:48:31 +09:00
2010-01-06 07:47:37 +09:00
return common_local_url ( 'getfile' ,
array ( 'filename' => $filename ));
2009-06-23 07:48:31 +09:00
2010-10-15 03:22:17 +09:00
}
2009-06-23 07:48:31 +09:00
2015-02-27 20:44:15 +09:00
if ( GNUsocial :: useHTTPS ()) {
2010-10-15 03:22:17 +09:00
$sslserver = common_config ( 'attachments' , 'sslserver' );
2009-06-23 07:48:31 +09:00
2010-10-15 03:22:17 +09:00
if ( empty ( $sslserver )) {
// XXX: this assumes that background dir == site dir + /file/
// not true if there's another server
if ( is_string ( common_config ( 'site' , 'sslserver' )) &&
mb_strlen ( common_config ( 'site' , 'sslserver' )) > 0 ) {
$server = common_config ( 'site' , 'sslserver' );
} else if ( common_config ( 'site' , 'server' )) {
$server = common_config ( 'site' , 'server' );
}
$path = common_config ( 'site' , 'path' ) . '/file/' ;
} else {
$server = $sslserver ;
$path = common_config ( 'attachments' , 'sslpath' );
if ( empty ( $path )) {
$path = common_config ( 'attachments' , 'path' );
}
2010-01-06 07:47:37 +09:00
}
2010-10-15 03:22:17 +09:00
$protocol = 'https' ;
} else {
$path = common_config ( 'attachments' , 'path' );
2010-01-06 07:47:37 +09:00
$server = common_config ( 'attachments' , 'server' );
2009-06-23 07:48:31 +09:00
2010-01-06 07:47:37 +09:00
if ( empty ( $server )) {
$server = common_config ( 'site' , 'server' );
}
2009-06-23 07:48:31 +09:00
2010-02-12 07:06:57 +09:00
$ssl = common_config ( 'attachments' , 'ssl' );
2010-01-06 07:47:37 +09:00
2010-02-12 07:06:57 +09:00
$protocol = ( $ssl ) ? 'https' : 'http' ;
2010-10-15 03:22:17 +09:00
}
2010-02-12 07:06:57 +09:00
2010-10-15 03:22:17 +09:00
if ( $path [ strlen ( $path ) - 1 ] != '/' ) {
$path .= '/' ;
2010-01-06 07:47:37 +09:00
}
2010-10-15 03:22:17 +09:00
if ( $path [ 0 ] != '/' ) {
$path = '/' . $path ;
}
return $protocol . '://' . $server . $path . $filename ;
2009-06-23 23:29:43 +09:00
}
2009-07-15 02:33:40 +09:00
2009-08-27 04:40:51 +09:00
function getEnclosure (){
$enclosure = ( object ) array ();
2014-08-05 17:54:00 +09:00
foreach ( array ( 'title' , 'url' , 'date' , 'modified' , 'size' , 'mimetype' ) as $key ) {
$enclosure -> $key = $this -> $key ;
}
2014-10-20 23:21:42 +09:00
$needMoreMetadataMimetypes = array ( null , 'application/xhtml+xml' );
2014-08-05 17:54:00 +09:00
if ( ! isset ( $this -> filename ) && in_array ( common_bare_mime ( $enclosure -> mimetype ), $needMoreMetadataMimetypes )) {
// This fetches enclosure metadata for non-local links with unset/HTML mimetypes,
// which may be enriched through oEmbed or similar (implemented as plugins)
Event :: handle ( 'FileEnclosureMetadata' , array ( $this , & $enclosure ));
2009-07-15 02:33:40 +09:00
}
2014-08-05 17:54:00 +09:00
if ( empty ( $enclosure -> mimetype ) || in_array ( common_bare_mime ( $enclosure -> mimetype ), $needMoreMetadataMimetypes )) {
// This means we either don't know what it is, so it can't
// be shown as an enclosure, or it is an HTML link which
// does not link to a resource with further metadata.
2014-06-02 08:26:23 +09:00
throw new ServerException ( 'Unknown enclosure mimetype, not enough metadata' );
}
2009-08-27 10:51:54 +09:00
return $enclosure ;
2009-07-15 02:33:40 +09:00
}
2010-03-03 09:30:09 +09:00
2010-11-09 10:22:01 +09:00
/**
* Get the attachment ' s thumbnail record , if any .
2014-04-22 03:39:28 +09:00
* Make sure you supply proper 'int' typed variables ( or null ) .
2010-11-09 10:22:01 +09:00
*
2014-04-22 03:39:28 +09:00
* @ param $width int Max width of thumbnail in pixels . ( if null , use common_config values )
* @ param $height int Max height of thumbnail in pixels . ( if null , square - crop to $width )
* @ param $crop bool Crop to the max - values ' aspect ratio
2014-04-21 18:35:42 +09:00
*
2010-11-09 10:22:01 +09:00
* @ return File_thumbnail
2015-02-25 23:13:47 +09:00
*
* @ throws UseFileAsThumbnailException if the file is considered an image itself and should be itself as thumbnail
* @ throws UnsupportedMediaException if , despite trying , we can ' t understand how to make a thumbnail for this format
* @ throws ServerException on various other errors
2010-11-09 10:22:01 +09:00
*/
2015-01-27 00:33:39 +09:00
public function getThumbnail ( $width = null , $height = null , $crop = false , $force_still = true )
2010-11-09 10:22:01 +09:00
{
2015-01-26 06:45:25 +09:00
// Get some more information about this file through our ImageFile class
$image = ImageFile :: fromFileObject ( $this );
2015-01-27 00:33:39 +09:00
if ( $image -> animated && ! common_config ( 'thumbnail' , 'animated' )) {
// null means "always use file as thumbnail"
// false means you get choice between frozen frame or original when calling getThumbnail
if ( is_null ( common_config ( 'thumbnail' , 'animated' )) || ! $force_still ) {
throw new UseFileAsThumbnailException ( $this -> id );
}
2015-01-26 06:45:25 +09:00
}
2015-03-04 21:12:42 +09:00
return $image -> getFileThumbnail ( $width , $height , $crop );
2014-04-22 03:39:28 +09:00
}
2014-04-17 02:14:26 +09:00
public function getPath ()
{
2015-02-25 05:11:25 +09:00
$filepath = self :: path ( $this -> filename );
if ( ! file_exists ( $filepath )) {
throw new FileNotFoundException ( $filepath );
}
return $filepath ;
2014-04-17 02:14:26 +09:00
}
2015-01-13 03:22:10 +09:00
2014-04-17 06:17:27 +09:00
public function getUrl ()
{
2015-01-13 03:22:10 +09:00
if ( ! empty ( $this -> filename )) {
// A locally stored file, so let's generate a URL for our instance.
$url = self :: url ( $this -> filename );
2015-02-20 03:07:43 +09:00
if ( self :: hashurl ( $url ) !== $this -> urlhash ) {
2015-01-13 03:22:10 +09:00
// For indexing purposes, in case we do a lookup on the 'url' field.
// also we're fixing possible changes from http to https, or paths
$this -> updateUrl ( $url );
}
return $url ;
}
// No local filename available, return the URL we have stored
2014-04-17 06:17:27 +09:00
return $this -> url ;
}
2014-04-17 02:14:26 +09:00
2015-02-20 02:34:48 +09:00
static public function getByUrl ( $url )
{
$file = new File ();
$file -> urlhash = self :: hashurl ( $url );
if ( ! $file -> find ( true )) {
throw new NoResultException ( $file );
}
return $file ;
}
2015-02-25 05:11:25 +09:00
/**
* @ param string $hashstr String of ( preferrably lower case ) hexadecimal characters , same as result of 'hash_file(...)'
*/
2015-10-02 05:14:49 +09:00
static public function getByHash ( $hashstr )
2015-02-25 05:11:25 +09:00
{
$file = new File ();
$file -> filehash = strtolower ( $hashstr );
if ( ! $file -> find ( true )) {
throw new NoResultException ( $file );
}
return $file ;
}
2015-01-13 03:22:10 +09:00
public function updateUrl ( $url )
{
2015-02-18 02:55:12 +09:00
$file = File :: getKV ( 'urlhash' , self :: hashurl ( $url ));
2015-01-13 03:22:10 +09:00
if ( $file instanceof File ) {
throw new ServerException ( 'URL already exists in DB' );
}
2015-02-18 02:55:12 +09:00
$sql = 'UPDATE %1$s SET urlhash=%2$s, url=%3$s WHERE urlhash=%4$s;' ;
2015-06-07 02:35:10 +09:00
$result = $this -> query ( sprintf ( $sql , $this -> tableName (),
2015-02-18 02:55:12 +09:00
$this -> _quote (( string ) self :: hashurl ( $url )),
2015-01-13 03:22:10 +09:00
$this -> _quote (( string ) $url ),
2015-02-18 02:55:12 +09:00
$this -> _quote (( string ) $this -> urlhash )));
2015-01-13 03:22:10 +09:00
if ( $result === false ) {
common_log_db_error ( $this , 'UPDATE' , __FILE__ );
2015-06-07 02:35:10 +09:00
throw new ServerException ( " Could not UPDATE { $this -> tableName () } .url " );
2015-01-13 03:22:10 +09:00
}
return $result ;
}
2010-12-29 05:57:31 +09:00
/**
* Blow the cache of notices that link to this URL
*
* @ param boolean $last Whether to blow the " last " cache too
*
* @ return void
*/
2010-12-29 04:58:55 +09:00
function blowCache ( $last = false )
{
2015-06-05 00:02:45 +09:00
self :: blow ( 'file:notice-ids:%s' , $this -> id );
2010-12-29 04:58:55 +09:00
if ( $last ) {
2015-06-05 00:02:45 +09:00
self :: blow ( 'file:notice-ids:%s;last' , $this -> id );
2010-12-29 04:58:55 +09:00
}
2010-12-29 06:44:49 +09:00
self :: blow ( 'file:notice-count:%d' , $this -> id );
2010-12-29 04:58:55 +09:00
}
/**
* Stream of notices linking to this URL
*
* @ param integer $offset Offset to show ; default is 0
* @ param integer $limit Limit of notices to show
* @ param integer $since_id Since this notice
* @ param integer $max_id Before this notice
*
* @ return array ids of notices that link to this file
*/
function stream ( $offset = 0 , $limit = NOTICES_PER_PAGE , $since_id = 0 , $max_id = 0 )
{
2011-03-25 07:04:19 +09:00
$stream = new FileNoticeStream ( $this );
2011-03-24 00:29:55 +09:00
return $stream -> getNotices ( $offset , $limit , $since_id , $max_id );
2010-12-29 04:58:55 +09:00
}
2010-12-29 06:44:49 +09:00
function noticeCount ()
{
$cacheKey = sprintf ( 'file:notice-count:%d' , $this -> id );
$count = self :: cacheGet ( $cacheKey );
if ( $count === false ) {
$f2p = new File_to_post ();
$f2p -> file_id = $this -> id ;
$count = $f2p -> count ();
self :: cacheSet ( $cacheKey , $count );
}
return $count ;
}
2014-05-12 21:33:41 +09:00
public function isLocal ()
{
return ! empty ( $this -> filename );
}
2014-05-12 22:16:41 +09:00
public function delete ( $useWhere = false )
{
// Delete the file, if it exists locally
if ( ! empty ( $this -> filename ) && file_exists ( self :: path ( $this -> filename ))) {
$deleted = @ unlink ( self :: path ( $this -> filename ));
if ( ! $deleted ) {
common_log ( LOG_ERR , sprintf ( 'Could not unlink existing file: "%s"' , self :: path ( $this -> filename )));
}
}
// Clear out related things in the database and filesystem, such as thumbnails
if ( Event :: handle ( 'FileDeleteRelated' , array ( $this ))) {
$thumbs = new File_thumbnail ();
$thumbs -> file_id = $this -> id ;
if ( $thumbs -> find ()) {
while ( $thumbs -> fetch ()) {
$thumbs -> delete ();
}
}
2015-04-16 06:25:12 +09:00
$f2p = new File_to_post ();
$f2p -> file_id = $this -> id ;
if ( $f2p -> find ()) {
while ( $f2p -> fetch ()) {
$f2p -> delete ();
}
}
2014-05-12 22:16:41 +09:00
}
// And finally remove the entry from the database
return parent :: delete ( $useWhere );
}
2014-08-05 18:30:45 +09:00
public function getTitle ()
{
$title = $this -> title ? : $this -> filename ;
return $title ? : null ;
}
2015-02-18 02:55:12 +09:00
static public function hashurl ( $url )
{
if ( empty ( $url )) {
throw new Exception ( 'No URL provided to hash algorithm.' );
}
return hash ( self :: URLHASH_ALG , $url );
}
2015-02-20 02:59:28 +09:00
static public function beforeSchemaUpdate ()
{
$table = strtolower ( get_called_class ());
$schema = Schema :: get ();
$schemadef = $schema -> getTableDef ( $table );
// 2015-02-19 We have to upgrade our table definitions to have the urlhash field populated
2015-02-20 03:36:59 +09:00
if ( isset ( $schemadef [ 'fields' ][ 'urlhash' ]) && isset ( $schemadef [ 'unique keys' ][ 'file_urlhash_key' ])) {
2015-02-20 02:59:28 +09:00
// We already have the urlhash field, so no need to migrate it.
return ;
}
2015-02-20 03:40:36 +09:00
echo " \n Found old $table table, upgrading it to contain 'urlhash' field... " ;
2015-05-28 04:31:29 +09:00
$file = new File ();
$file -> query ( sprintf ( 'SELECT id, LEFT(url, 191) AS shortenedurl, COUNT(*) AS c FROM %1$s WHERE LENGTH(url)>191 GROUP BY shortenedurl HAVING c > 1' , $schema -> quoteIdentifier ( $table )));
print " \n Found { $file -> N } URLs with too long entries in file table \n " ;
while ( $file -> fetch ()) {
// We've got a URL that is too long for our future file table
// so we'll cut it. We could save the original URL, but there is
// no guarantee it is complete anyway since the previous max was 255 chars.
$dupfile = new File ();
// First we find file entries that would be duplicates of this when shortened
// ... and we'll just throw the dupes out the window for now! It's already so borken.
$dupfile -> query ( sprintf ( 'SELECT * FROM file WHERE LEFT(url, 191) = "%1$s"' , $file -> shortenedurl ));
// Leave one of the URLs in the database by using ->find(true) (fetches first entry)
if ( $dupfile -> find ( true )) {
print " \n Shortening url entry for $table id: { $file -> id } [ " ;
$orig = clone ( $dupfile );
$dupfile -> url = $file -> shortenedurl ; // make sure it's only 191 chars from now on
$dupfile -> update ( $orig );
print " \n Deleting duplicate entries of too long URL on $table id: { $file -> id } [ " ;
// only start deleting with this fetch.
while ( $dupfile -> fetch ()) {
print " . " ;
$dupfile -> delete ();
}
print " ] \n " ;
} else {
print " \n Warning! URL suddenly disappeared from database: { $file -> url } \n " ;
}
}
2015-05-28 04:54:51 +09:00
echo " ...and now all the non-duplicates which are longer than 191 characters... \n " ;
$file -> query ( 'UPDATE file SET url=LEFT(url, 191) WHERE LENGTH(url)>191' );
2015-05-28 04:31:29 +09:00
echo " \n ...now running hacky pre-schemaupdate change for $table : " ;
2015-02-20 02:59:28 +09:00
// We have to create a urlhash that is _not_ the primary key,
// transfer data and THEN run checkSchema
$schemadef [ 'fields' ][ 'urlhash' ] = array (
'type' => 'varchar' ,
'length' => 64 ,
2015-05-28 05:37:20 +09:00
'not null' => false , // this is because when adding column, all entries will _be_ NULL!
2015-02-20 06:06:43 +09:00
'description' => 'sha256 of destination URL (url field)' ,
2015-02-20 02:59:28 +09:00
);
2015-02-20 06:06:43 +09:00
$schemadef [ 'fields' ][ 'url' ] = array (
'type' => 'text' ,
'description' => 'destination URL after following possible redirections' ,
);
unset ( $schemadef [ 'unique keys' ]);
2015-02-20 02:59:28 +09:00
$schema -> ensureTable ( $table , $schemadef );
echo " DONE. \n " ;
$classname = ucfirst ( $table );
$tablefix = new $classname ;
// urlhash is hash('sha256', $url) in the File table
2015-02-20 03:40:36 +09:00
echo " Updating urlhash fields in $table table... " ;
2015-02-20 02:59:28 +09:00
// Maybe very MySQL specific :(
$tablefix -> query ( sprintf ( 'UPDATE %1$s SET %2$s=%3$s;' ,
$schema -> quoteIdentifier ( $table ),
'urlhash' ,
// The line below is "result of sha256 on column `url`"
'SHA2(url, 256)' ));
echo " DONE. \n " ;
echo " Resuming core schema upgrade... " ;
}
2009-05-12 02:45:00 +09:00
}