Re: RFC: android logger feedback request
From: Geunsik Lim
Date: Wed Jan 04 2012 - 10:34:30 EST
On Thu, Dec 29, 2011 at 9:39 AM, Andrew Morton
<akpm@xxxxxxxxxxxxxxxxxxxx> wrote:
> On Wed, 21 Dec 2011 14:59:15 -0800
> Tim Bird <tim.bird@xxxxxxxxxxx> wrote:
>
>> Hi all,
>>
>> I'm looking for feedback on the Android logger code,
>
> The code looks nice.
>
>>
>> ...
>>
>> +/* logger_offset - returns index 'n' into the log via (optimized) modulus */
>> +#define logger_offset(n) Â Â ((n) & (log->size - 1))
>> +
>
> This macro depends upon the presence of a local variable called "log"
> and is therefore all stinky. ÂPass "log" in as an arg and convert it to
> a regular C function.
>
>>
>> ...
>>
>> +/*
>> + * get_entry_len - Grabs the length of the payload of the next entry starting
>> + * from 'off'.
>> + *
>> + * Caller needs to hold log->mutex.
>> + */
>> +static __u32 get_entry_len(struct logger_log *log, size_t off)
>> +{
>> + Â Â __u16 val;
>> +
>> + Â Â switch (log->size - off) {
>> + Â Â case 1:
>> + Â Â Â Â Â Â memcpy(&val, log->buffer + off, 1);
>> + Â Â Â Â Â Â memcpy(((char *) &val) + 1, log->buffer, 1);
>
> So numbers in the buffer are in host endian order. ÂThat's worth
> capturing in a comment somewhere.
>
> There must be a way of doing the above more neatly, using
> log->buffer[off] and log->buffer[0]. ÂPerhaps using
> include/linux/unaligned/packed_struct.h.
>
>> + Â Â Â Â Â Â break;
>> + Â Â default:
>> + Â Â Â Â Â Â memcpy(&val, log->buffer + off, 2);
>
> get_unaligned()
>
>> + Â Â }
>> +
>> + Â Â return sizeof(struct logger_entry) + val;
>> +}
>> +
>>
>> ...
>>
>> +static ssize_t logger_read(struct file *file, char __user *buf,
>> + Â Â Â Â Â Â Â Â Â Â Â Âsize_t count, loff_t *pos)
>> +{
>> + Â Â struct logger_reader *reader = file->private_data;
>> + Â Â struct logger_log *log = reader->log;
>> + Â Â ssize_t ret;
>> + Â Â DEFINE_WAIT(wait);
>> +
>> +start:
>> + Â Â while (1) {
>> + Â Â Â Â Â Â prepare_to_wait(&log->wq, &wait, TASK_INTERRUPTIBLE);
>> +
>> + Â Â Â Â Â Â mutex_lock(&log->mutex);
>
> If mutex_lock() had to wait for the mutex, it will return in state
> TASK_RUNNING, thus rubbing out the effects of prepare_to_wait(). ÂWe'll
> just loop again so this is a benign buglet.
>
> Could we lose a wakeup by running prepaer_to_wait() outside the lock?
> I don't think so, but I stopped thinking about it when I saw the above
> bug. ÂThese two lines should be switched around.
>
>> + Â Â Â Â Â Â ret = (log->w_off == reader->r_off);
>> + Â Â Â Â Â Â mutex_unlock(&log->mutex);
>> + Â Â Â Â Â Â if (!ret)
>> + Â Â Â Â Â Â Â Â Â Â break;
>> +
>> + Â Â Â Â Â Â if (file->f_flags & O_NONBLOCK) {
>> + Â Â Â Â Â Â Â Â Â Â ret = -EAGAIN;
>> + Â Â Â Â Â Â Â Â Â Â break;
>> + Â Â Â Â Â Â }
>> +
>> + Â Â Â Â Â Â if (signal_pending(current)) {
>> + Â Â Â Â Â Â Â Â Â Â ret = -EINTR;
>> + Â Â Â Â Â Â Â Â Â Â break;
>> + Â Â Â Â Â Â }
>> +
>> + Â Â Â Â Â Â schedule();
>> + Â Â }
>> +
>> + Â Â finish_wait(&log->wq, &wait);
>> + Â Â if (ret)
>> + Â Â Â Â Â Â return ret;
>> +
>> + Â Â mutex_lock(&log->mutex);
>> +
>> + Â Â /* is there still something to read or did we race? */
>> + Â Â if (unlikely(log->w_off == reader->r_off)) {
>> + Â Â Â Â Â Â mutex_unlock(&log->mutex);
>> + Â Â Â Â Â Â goto start;
>> + Â Â }
>> +
>> + Â Â /* get the size of the next entry */
>> + Â Â ret = get_entry_len(log, reader->r_off);
>> + Â Â if (count < ret) {
>> + Â Â Â Â Â Â ret = -EINVAL;
>> + Â Â Â Â Â Â goto out;
>> + Â Â }
>> +
>> + Â Â /* get exactly one entry from the log */
>> + Â Â ret = do_read_log_to_user(log, reader, buf, ret);
>> +
>> +out:
>> + Â Â mutex_unlock(&log->mutex);
>> +
>> + Â Â return ret;
>> +}
>> +
>>
>> ...
>>
>> +/*
>> + * clock_interval - is a < c < b in mod-space? Put another way, does the line
>> + * from a to b cross c?
>> + */
>
> This is where my little brain started to hurt. ÂI assume it's correct ;)
>
>> +static inline int clock_interval(size_t a, size_t b, size_t c)
>> +{
>> + Â Â if (b < a) {
>> + Â Â Â Â Â Â if (a < c || b >= c)
>> + Â Â Â Â Â Â Â Â Â Â return 1;
>> + Â Â } else {
>> + Â Â Â Â Â Â if (a < c && b >= c)
>> + Â Â Â Â Â Â Â Â Â Â return 1;
>> + Â Â }
>> +
>> + Â Â return 0;
>> +}
>
> The explicit inline(s) are increaseingly old-fashioned. Âgcc is good
> about this now.
>
>>
>> ...
>>
>> +static ssize_t do_write_log_from_user(struct logger_log *log,
>> + Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â const void __user *buf, size_t count)
>> +{
>> + Â Â size_t len;
>> +
>> + Â Â len = min(count, log->size - log->w_off);
>> + Â Â if (len && copy_from_user(log->buffer + log->w_off, buf, len))
>> + Â Â Â Â Â Â return -EFAULT;
>> +
>> + Â Â if (count != len)
>> + Â Â Â Â Â Â if (copy_from_user(log->buffer, buf + len, count - len))
>> + Â Â Â Â Â Â Â Â Â Â return -EFAULT;
>
> Is it correct to simply return here without updating ->w_off?
> We've just copied "len" bytes in from userspace.
>
>> + Â Â log->w_off = logger_offset(log->w_off + count);
>> +
>> + Â Â return count;
>> +}
>> +
>> +/*
>> + * logger_aio_write - our write method, implementing support for write(),
>> + * writev(), and aio_write(). Writes are our fast path, and we try to optimize
>> + * them above all else.
>> + */
>> +ssize_t logger_aio_write(struct kiocb *iocb, const struct iovec *iov,
>> + Â Â Â Â Â Â Â Â Â Â Âunsigned long nr_segs, loff_t ppos)
>> +{
>> + Â Â struct logger_log *log = file_get_log(iocb->ki_filp);
>> + Â Â size_t orig = log->w_off;
>> + Â Â struct logger_entry header;
>> + Â Â struct timespec now;
>> + Â Â ssize_t ret = 0;
>> +
>> + Â Â now = current_kernel_time();
>> +
>> + Â Â header.pid = current->tgid;
>> + Â Â header.tid = current->pid;
>
> hm, I thought task_struct.pid was the pid.
It's right.
>
> Also, pids are not unique system-wide. ÂIf the user is using PID
I think that this code is correct because current->tgid means
process id of user-space
and current->pid means thread id of user-space actually. Is it not make sense?
> namespaces then the logs will contain what may be fatally confusing duplicates.
> This needs to be fixed, I expect.
header.tid as a thread id of user-space is unique system-wide at least
although header.pid is not unqueue system-wide.
Why should we think/understand that the logs contain duplicated
information to users
who run logcat command for collecting and viewing system debug output?
Thanks.
>
> There are broader namespace issues which should be thought about. ÂDoes
> it make sense for readers in one container to be returned logs from a
> different container? ÂPerhaps the do-it-via-a-filesystem proposals can
> address this.
>
>> + Â Â header.sec = now.tv_sec;
>> + Â Â header.nsec = now.tv_nsec;
>> + Â Â header.len = min_t(size_t, iocb->ki_left, LOGGER_ENTRY_MAX_PAYLOAD);
>> +
>> + Â Â /* null writes succeed, return zero */
>> + Â Â if (unlikely(!header.len))
>> + Â Â Â Â Â Â return 0;
>> +
>> + Â Â mutex_lock(&log->mutex);
>> +
>> + Â Â /*
>> + Â Â Â* Fix up any readers, pulling them forward to the first readable
>> + Â Â Â* entry after (what will be) the new write offset. We do this now
>> + Â Â Â* because if we partially fail, we can end up with clobbered log
>> + Â Â Â* entries that encroach on readable buffer.
>> + Â Â Â*/
>> + Â Â fix_up_readers(log, sizeof(struct logger_entry) + header.len);
>> +
>> + Â Â do_write_log(log, &header, sizeof(struct logger_entry));
>> +
>> + Â Â while (nr_segs-- > 0) {
>> + Â Â Â Â Â Â size_t len;
>> + Â Â Â Â Â Â ssize_t nr;
>> +
>> + Â Â Â Â Â Â /* figure out how much of this vector we can keep */
>> + Â Â Â Â Â Â len = min_t(size_t, iov->iov_len, header.len - ret);
>> +
>> + Â Â Â Â Â Â /* write out this segment's payload */
>> + Â Â Â Â Â Â nr = do_write_log_from_user(log, iov->iov_base, len);
>> + Â Â Â Â Â Â if (unlikely(nr < 0)) {
>> + Â Â Â Â Â Â Â Â Â Â log->w_off = orig;
>> + Â Â Â Â Â Â Â Â Â Â mutex_unlock(&log->mutex);
>> + Â Â Â Â Â Â Â Â Â Â return nr;
>> + Â Â Â Â Â Â }
>> +
>> + Â Â Â Â Â Â iov++;
>> + Â Â Â Â Â Â ret += nr;
>> + Â Â }
>> +
>> + Â Â mutex_unlock(&log->mutex);
>> +
>> + Â Â /* wake up any blocked readers */
>> + Â Â wake_up_interruptible(&log->wq);
>> +
>> + Â Â return ret;
>> +}
>> +
>>
>> ...
>>
>> +static int logger_release(struct inode *ignored, struct file *file)
>> +{
>> + Â Â if (file->f_mode & FMODE_READ) {
>> + Â Â Â Â Â Â struct logger_reader *reader = file->private_data;
>> + Â Â Â Â Â Â list_del(&reader->list);
>
> locking for reader->list?
>
>> + Â Â Â Â Â Â kfree(reader);
>> + Â Â }
>> +
>> + Â Â return 0;
>> +}
>>
>> ...
>>
>> +static long logger_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
>
> ew...
>
>> +static struct logger_log *get_log_from_minor(int minor)
>> +{
>> + Â Â if (log_main.misc.minor == minor)
>> + Â Â Â Â Â Â return &log_main;
>> + Â Â if (log_events.misc.minor == minor)
>> + Â Â Â Â Â Â return &log_events;
>> + Â Â if (log_radio.misc.minor == minor)
>> + Â Â Â Â Â Â return &log_radio;
>> + Â Â if (log_system.misc.minor == minor)
>> + Â Â Â Â Â Â return &log_system;
>> + Â Â return NULL;
>> +}
>
> ew...
>
>
> --
> To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
> the body of a message to majordomo@xxxxxxxxxxxxxxx
> More majordomo info at Âhttp://vger.kernel.org/majordomo-info.html
> Please read the FAQ at Âhttp://www.tux.org/lkml/
--
Best regards,
Geunsik Lim, Samsung Electronics
Homepage: http://leemgs.fedorapeople.org
-----------------------------------------------------------------------
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/
-----------------------------------------------------------------------
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/